diff --git a/latest/CODE_OF_CONDUCT.html b/latest/CODE_OF_CONDUCT.html
index 28971c139..80826f485 100644
--- a/latest/CODE_OF_CONDUCT.html
+++ b/latest/CODE_OF_CONDUCT.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Contributor Covenant Code of Conduct &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Contributor Covenant Code of Conduct &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="_static/custom.css?v=439db15d" />
@@ -225,7 +225,7 @@ <h2>Attribution<a class="headerlink" href="#attribution" title="Link to this hea
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a115810> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd560e0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/SECURITY.html b/latest/SECURITY.html
index 6e37733c4..230ac2f38 100644
--- a/latest/SECURITY.html
+++ b/latest/SECURITY.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Security Policy &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Security Policy &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="_static/custom.css?v=439db15d" />
@@ -120,7 +120,7 @@ <h2>Report a Vulnerability<a class="headerlink" href="#report-a-vulnerability" t
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a03fa60> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd8fe50> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/_sources/docs/community/contributing.md.txt b/latest/_sources/docs/community/contributing.md.txt
index 7a5102849..faffe40a9 100644
--- a/latest/_sources/docs/community/contributing.md.txt
+++ b/latest/_sources/docs/community/contributing.md.txt
@@ -116,8 +116,8 @@ To check bazel files manually:
 
 ```bash
 # install go
-wget https://golang.org/dl/go1.15.3.linux-.html64.tar.gz
-sudo tar -C /usr/local -xzf go1.15.3.linux-.html64.tar.gz
+wget https://golang.org/dl/go1.15.3.linux-amd64.tar.gz
+sudo tar -C /usr/local -xzf go1.15.3.linux-amd64.tar.gz
 export PATH=$PATH:/usr/local/go/bin
 
 # install buildifier
diff --git a/latest/_sources/docs/design/how_to_write_custom_op.md.txt b/latest/_sources/docs/design/how_to_write_custom_op.md.txt
index 8d3d04248..05626fb31 100644
--- a/latest/_sources/docs/design/how_to_write_custom_op.md.txt
+++ b/latest/_sources/docs/design/how_to_write_custom_op.md.txt
@@ -130,7 +130,7 @@ class EltwiseBaseOp : public OpKernel {
       }
       ......
       // Create an eltwise forward descriptor and primitive descriptor
-      eltwise_forward::desc fwd_desc(prop_kind::forward, alg_kind_, src.html,
+      eltwise_forward::desc fwd_desc(prop_kind::forward, alg_kind_, src_md,
                                      alpha_, beta_);
       dnnl::primitive_attr attr;
       attr.set_scratchpad_mode(dnnl::scratchpad_mode::user);
diff --git a/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt b/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt
index a3d3297b6..de35ba936 100644
--- a/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt
+++ b/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt
@@ -72,7 +72,7 @@ The steps to install the runtime components in Ubuntu Linux (within WSL2) are:
     sudo apt-get install -y gpg-agent wget
     wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | 
     sudo gpg --dearmor --output /usr/share/keyrings/intel-graphics.gpg
-    echo "deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
+    echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
     sudo apt-get update
     ```
 
@@ -122,7 +122,7 @@ The steps to install the runtime components in Ubuntu Linux are:
     sudo apt-get install -y gpg-agent wget
     wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | 
     sudo gpg --dearmor --output /usr/share/keyrings/intel-graphics.gpg
-    echo "deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
+    echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
     sudo apt-get update
     ```
 
diff --git a/latest/_static/documentation_options.js b/latest/_static/documentation_options.js
index e6c0d9379..4bcfb6d68 100644
--- a/latest/_static/documentation_options.js
+++ b/latest/_static/documentation_options.js
@@ -1,5 +1,5 @@
 const DOCUMENTATION_OPTIONS = {
-    VERSION: '0.1.dev1+gc09a994',
+    VERSION: '0.1.dev1+g26e99fc',
     LANGUAGE: 'en',
     COLLAPSE_INDEX: false,
     BUILDER: 'html',
diff --git a/latest/docker/README.html b/latest/docker/README.html
index e9ece2143..c1c4c162b 100644
--- a/latest/docker/README.html
+++ b/latest/docker/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel® Extension for TensorFlow* Docker Container Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel® Extension for TensorFlow* Docker Container Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../_static/custom.css?v=439db15d" />
@@ -213,7 +213,7 @@ <h2>Verify That Intel GPU is Accessible From TensorFlow<a class="headerlink" hre
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a03cb20> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd8e620> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docker/tensorflow-serving/README.html b/latest/docker/tensorflow-serving/README.html
index 0142b97fa..d83c89a6b 100644
--- a/latest/docker/tensorflow-serving/README.html
+++ b/latest/docker/tensorflow-serving/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel® Extension for TensorFlow* Serving - Docker Container Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel® Extension for TensorFlow* Serving - Docker Container Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -169,7 +169,7 @@ <h2>Running the Container<a class="headerlink" href="#running-the-container" tit
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d1ea0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd7bdc0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/README.html b/latest/docs/README.html
index f3da94eef..2e882c24d 100644
--- a/latest/docs/README.html
+++ b/latest/docs/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Welcome to Intel® Extension for TensorFlow* documentation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Welcome to Intel® Extension for TensorFlow* documentation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../_static/custom.css?v=439db15d" />
@@ -234,7 +234,7 @@ <h2>Highlights<a class="headerlink" href="#highlights" title="Link to this headi
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d19f0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd787c0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/build_docs/docs_build_tips.html b/latest/docs/build_docs/docs_build_tips.html
index 58622d364..966b2418e 100644
--- a/latest/docs/build_docs/docs_build_tips.html
+++ b/latest/docs/build_docs/docs_build_tips.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Online Documentation Build Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Online Documentation Build Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -161,7 +161,7 @@ <h2>Build to Local Test<a class="headerlink" href="#build-to-local-test" title="
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d27d0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd7aaa0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/build_docs/source/index.html b/latest/docs/build_docs/source/index.html
index 012c15b83..8ed8cd38d 100644
--- a/latest/docs/build_docs/source/index.html
+++ b/latest/docs/build_docs/source/index.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Welcome to Intel ® Extension for TensorFlow* documentation! &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Welcome to Intel ® Extension for TensorFlow* documentation! &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -110,7 +110,7 @@ <h1>Welcome to Intel ® Extension for TensorFlow* documentation!<a class="header
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d3f10> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd78fa0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/community/contributing.html b/latest/docs/community/contributing.html
index e8443acb3..ff90cfbd6 100644
--- a/latest/docs/community/contributing.html
+++ b/latest/docs/community/contributing.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Contributing guidelines &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Contributing guidelines &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -221,8 +221,8 @@ <h3>bazel style guide<a class="headerlink" href="#bazel-style-guide" title="Link
 <p><a class="reference external" href="https://github.com/bazelbuild/buildtools/tree/master/buildifier">buildifier</a> is a tool for formatting bazel <code class="docutils literal notranslate"><span class="pre">BUILD</span></code> and <code class="docutils literal notranslate"><span class="pre">.bzl</span></code> files with a standard convention (<code class="docutils literal notranslate"><span class="pre">xxx.tpl</span></code> files are not supported).</p>
 <p>To check bazel files manually:</p>
 <div class="highlight-bash notranslate"><div class="highlight"><pre><span></span><span class="c1"># install go</span>
-wget<span class="w"> </span>https://golang.org/dl/go1.15.3.linux-.html64.tar.gz
-sudo<span class="w"> </span>tar<span class="w"> </span>-C<span class="w"> </span>/usr/local<span class="w"> </span>-xzf<span class="w"> </span>go1.15.3.linux-.html64.tar.gz
+wget<span class="w"> </span>https://golang.org/dl/go1.15.3.linux-amd64.tar.gz
+sudo<span class="w"> </span>tar<span class="w"> </span>-C<span class="w"> </span>/usr/local<span class="w"> </span>-xzf<span class="w"> </span>go1.15.3.linux-amd64.tar.gz
 <span class="nb">export</span><span class="w"> </span><span class="nv">PATH</span><span class="o">=</span><span class="nv">$PATH</span>:/usr/local/go/bin
 
 <span class="c1"># install buildifier</span>
@@ -260,7 +260,7 @@ <h3>Documentation style guide<a class="headerlink" href="#documentation-style-gu
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d2a10> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd8e380> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/community/releases.html b/latest/docs/community/releases.html
index 11d546c54..36b2dec32 100644
--- a/latest/docs/community/releases.html
+++ b/latest/docs/community/releases.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Releases &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Releases &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -130,7 +130,7 @@ <h2>Incompatible Changes<a class="headerlink" href="#incompatible-changes" title
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0f7580> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd552a0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/design/directory_structure.html b/latest/docs/design/directory_structure.html
index e754aedfb..ac916d806 100644
--- a/latest/docs/design/directory_structure.html
+++ b/latest/docs/design/directory_structure.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Directory Tree Structure &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Directory Tree Structure &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -186,7 +186,7 @@ <h1>Directory Tree Structure<a class="headerlink" href="#directory-tree-structur
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a82cbb0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd55f30> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/design/extension_design.html b/latest/docs/design/extension_design.html
index 6251c5069..27ed1ca48 100644
--- a/latest/docs/design/extension_design.html
+++ b/latest/docs/design/extension_design.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Extension Design &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Extension Design &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -124,7 +124,7 @@ <h2>Resources<a class="headerlink" href="#resources" title="Link to this heading
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a115c30> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd0850> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/design/how_to_write_custom_op.html b/latest/docs/design/how_to_write_custom_op.html
index 96e714f18..35fc31559 100644
--- a/latest/docs/design/how_to_write_custom_op.html
+++ b/latest/docs/design/how_to_write_custom_op.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>How to write custom op &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>How to write custom op &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -232,7 +232,7 @@ <h2>4.  Implement the kernels<a class="headerlink" href="#implement-the-kernels"
 <span class="w">      </span><span class="p">}</span>
 <span class="w">      </span><span class="p">......</span>
 <span class="w">      </span><span class="c1">// Create an eltwise forward descriptor and primitive descriptor</span>
-<span class="w">      </span><span class="n">eltwise_forward</span><span class="o">::</span><span class="n">desc</span><span class="w"> </span><span class="n">fwd_desc</span><span class="p">(</span><span class="n">prop_kind</span><span class="o">::</span><span class="n">forward</span><span class="p">,</span><span class="w"> </span><span class="n">alg_kind_</span><span class="p">,</span><span class="w"> </span><span class="n">src</span><span class="p">.</span><span class="n">html</span><span class="p">,</span>
+<span class="w">      </span><span class="n">eltwise_forward</span><span class="o">::</span><span class="n">desc</span><span class="w"> </span><span class="n">fwd_desc</span><span class="p">(</span><span class="n">prop_kind</span><span class="o">::</span><span class="n">forward</span><span class="p">,</span><span class="w"> </span><span class="n">alg_kind_</span><span class="p">,</span><span class="w"> </span><span class="n">src_md</span><span class="p">,</span>
 <span class="w">                                     </span><span class="n">alpha_</span><span class="p">,</span><span class="w"> </span><span class="n">beta_</span><span class="p">);</span>
 <span class="w">      </span><span class="n">dnnl</span><span class="o">::</span><span class="n">primitive_attr</span><span class="w"> </span><span class="n">attr</span><span class="p">;</span>
 <span class="w">      </span><span class="n">attr</span><span class="p">.</span><span class="n">set_scratchpad_mode</span><span class="p">(</span><span class="n">dnnl</span><span class="o">::</span><span class="n">scratchpad_mode</span><span class="o">::</span><span class="n">user</span><span class="p">);</span>
@@ -381,7 +381,7 @@ <h2>9.  Install and Verify<a class="headerlink" href="#install-and-verify" title
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0f4d00> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd555a0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/design/optimization/README.html b/latest/docs/design/optimization/README.html
index 11faf1ee1..83b06b9d6 100644
--- a/latest/docs/design/optimization/README.html
+++ b/latest/docs/design/optimization/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Optimizations Design &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Optimizations Design &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -109,7 +109,7 @@ <h1>Optimizations Design<a class="headerlink" href="#optimizations-design" title
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d0550> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd7a260> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/design/optimization/oneDNN_object_cache.html b/latest/docs/design/optimization/oneDNN_object_cache.html
index 63ce24afe..8f40a54b2 100644
--- a/latest/docs/design/optimization/oneDNN_object_cache.html
+++ b/latest/docs/design/optimization/oneDNN_object_cache.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>oneDNN object cache optimization &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>oneDNN object cache optimization &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -130,7 +130,7 @@ <h2>Optimization in convolution<a class="headerlink" href="#optimization-in-conv
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d1f90> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd78c70> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/FAQ.html b/latest/docs/guide/FAQ.html
index aae9575d8..b49e4dbad 100644
--- a/latest/docs/guide/FAQ.html
+++ b/latest/docs/guide/FAQ.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Frequently Asked Questions &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Frequently Asked Questions &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -206,7 +206,7 @@ <h3>Runtime<a class="headerlink" href="#runtime" title="Link to this heading">
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a116920> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd0be0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/INT8_quantization.html b/latest/docs/guide/INT8_quantization.html
index 79b6a57cf..37400e6e0 100644
--- a/latest/docs/guide/INT8_quantization.html
+++ b/latest/docs/guide/INT8_quantization.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>INT8 Quantization &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>INT8 Quantization &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -159,7 +159,7 @@ <h2>Usage<a class="headerlink" href="#usage" title="Link to this heading"></a
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d03a0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd7ba00> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/OpenXLA.html b/latest/docs/guide/OpenXLA.html
index de7465dc7..7d6b6531c 100644
--- a/latest/docs/guide/OpenXLA.html
+++ b/latest/docs/guide/OpenXLA.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>OpenXLA &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>OpenXLA &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -212,7 +212,7 @@ <h2>References<a class="headerlink" href="#references" title="Link to this headi
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0f5750> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd56320> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/XPUAutoShard.html b/latest/docs/guide/XPUAutoShard.html
index 869527655..ec81a7d39 100644
--- a/latest/docs/guide/XPUAutoShard.html
+++ b/latest/docs/guide/XPUAutoShard.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>XPUAutoShard on GPU [Experimental] &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>XPUAutoShard on GPU [Experimental] &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -194,7 +194,7 @@ <h3>Examples<a class="headerlink" href="#examples" title="Link to this heading">
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a116890> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd2da0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/aamp_tune.html b/latest/docs/guide/aamp_tune.html
index f6d02bd7d..1f553f2f9 100644
--- a/latest/docs/guide/aamp_tune.html
+++ b/latest/docs/guide/aamp_tune.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Tune Advanced Auto Mixed Precision &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Tune Advanced Auto Mixed Precision &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -439,7 +439,7 @@ <h3>Tuning Performance Example on MobileNet<a class="headerlink" href="#tuning-p
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0f54b0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd55c60> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/advanced_auto_mixed_precision.html b/latest/docs/guide/advanced_auto_mixed_precision.html
index 47ce26c57..c01c91932 100644
--- a/latest/docs/guide/advanced_auto_mixed_precision.html
+++ b/latest/docs/guide/advanced_auto_mixed_precision.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Advanced Auto Mixed Precision &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Advanced Auto Mixed Precision &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -420,7 +420,7 @@ <h3>Custom Operation<a class="headerlink" href="#custom-operation" title="Link t
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d2920> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd7b220> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/environment_variables.html b/latest/docs/guide/environment_variables.html
index e25b2230f..063de7ff5 100644
--- a/latest/docs/guide/environment_variables.html
+++ b/latest/docs/guide/environment_variables.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Environment Variables &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Environment Variables &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -234,7 +234,7 @@ <h3>Auto Mixed Precision Options<a class="headerlink" href="#auto-mixed-precisio
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92cb20> 
+   <jinja2.runtime.BlockReference object at 0x7f124d0b4100> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/features.html b/latest/docs/guide/features.html
index 41d90a796..6227426a4 100644
--- a/latest/docs/guide/features.html
+++ b/latest/docs/guide/features.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Features &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Features &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -227,7 +227,7 @@ <h2>TensorFlow Serving<a class="headerlink" href="#tensorflow-serving" title="Li
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92c790> 
+   <jinja2.runtime.BlockReference object at 0x7f124d4d33a0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/how_to_enable_profiler.html b/latest/docs/guide/how_to_enable_profiler.html
index 256b2eb97..a2fe76fd7 100644
--- a/latest/docs/guide/how_to_enable_profiler.html
+++ b/latest/docs/guide/how_to_enable_profiler.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>GPU Profiler &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>GPU Profiler &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -212,7 +212,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a266200> 
+   <jinja2.runtime.BlockReference object at 0x7f124d3f1270> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/infrastructure.html b/latest/docs/guide/infrastructure.html
index 4416ecf43..89f538f8c 100644
--- a/latest/docs/guide/infrastructure.html
+++ b/latest/docs/guide/infrastructure.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Infrastructure &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Infrastructure &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -147,7 +147,7 @@ <h2>XPU Engine<a class="headerlink" href="#xpu-engine" title="Link to this headi
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4aa562c0> 
+   <jinja2.runtime.BlockReference object at 0x7f124f0503a0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/itex_fusion.html b/latest/docs/guide/itex_fusion.html
index 616e16cd9..ae4043d82 100644
--- a/latest/docs/guide/itex_fusion.html
+++ b/latest/docs/guide/itex_fusion.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Graph fusion &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Graph fusion &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -315,7 +315,7 @@ <h2>Generic layout optimizer<a class="headerlink" href="#generic-layout-optimize
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4aa551e0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cef3220> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/itex_ops.html b/latest/docs/guide/itex_ops.html
index ede1dbe66..c78caf275 100644
--- a/latest/docs/guide/itex_ops.html
+++ b/latest/docs/guide/itex_ops.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Customized Operators &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Customized Operators &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -305,7 +305,7 @@ <h2><code class="docutils literal notranslate"><span class="pre">itex.ops.ItexLS
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a77b9a0> 
+   <jinja2.runtime.BlockReference object at 0x7f124d3adf00> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/itex_ops_override.html b/latest/docs/guide/itex_ops_override.html
index 814d61fe7..502bc059f 100644
--- a/latest/docs/guide/itex_ops_override.html
+++ b/latest/docs/guide/itex_ops_override.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Operators Override &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Operators Override &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -213,7 +213,7 @@ <h2>AdamW<a class="headerlink" href="#adamw" title="Link to this heading"></a
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4adbb4c0> 
+   <jinja2.runtime.BlockReference object at 0x7f124da24910> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/keras3_support.html b/latest/docs/guide/keras3_support.html
index 3ccfbfc5d..af4c06d14 100644
--- a/latest/docs/guide/keras3_support.html
+++ b/latest/docs/guide/keras3_support.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Keras 3 Overview &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Keras 3 Overview &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -234,7 +234,7 @@ <h2>Situations leads to warning or Error<a class="headerlink" href="#situations-
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92cca0> 
+   <jinja2.runtime.BlockReference object at 0x7f124dbb6e90> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/keras_mixed_precision.html b/latest/docs/guide/keras_mixed_precision.html
index 798507445..1c7ac29cb 100644
--- a/latest/docs/guide/keras_mixed_precision.html
+++ b/latest/docs/guide/keras_mixed_precision.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Keras Mixed Precision &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Keras Mixed Precision &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -417,7 +417,7 @@ <h2>Training the model with a custom training loop<a class="headerlink" href="#t
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92c3d0> 
+   <jinja2.runtime.BlockReference object at 0x7f124d038c70> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/launch.html b/latest/docs/guide/launch.html
index 3341db74d..a1e0e1f61 100644
--- a/latest/docs/guide/launch.html
+++ b/latest/docs/guide/launch.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Launch Script User Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Launch Script User Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -913,7 +913,7 @@ <h4>Default memory allocator<a class="headerlink" href="#default-memory-allocato
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a266140> 
+   <jinja2.runtime.BlockReference object at 0x7f124f052fb0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/next_pluggable_device.html b/latest/docs/guide/next_pluggable_device.html
index ba519f3d6..2e6a7e3e1 100644
--- a/latest/docs/guide/next_pluggable_device.html
+++ b/latest/docs/guide/next_pluggable_device.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>NextPluggableDevice Overview &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>NextPluggableDevice Overview &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -176,7 +176,7 @@ <h3>Check Currently Used Device Type<a class="headerlink" href="#check-currently
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4af865f0> 
+   <jinja2.runtime.BlockReference object at 0x7f124f053400> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/performance.html b/latest/docs/guide/performance.html
index aac770539..0cd4a93e8 100644
--- a/latest/docs/guide/performance.html
+++ b/latest/docs/guide/performance.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Performance Data &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Performance Data &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -984,7 +984,7 @@ <h2>Additional Performance Data for Intel AI Data Center Products<a class="heade
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4ae00460> 
+   <jinja2.runtime.BlockReference object at 0x7f124da260b0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/practice_guide.html b/latest/docs/guide/practice_guide.html
index f3a3763a1..8b154d013 100644
--- a/latest/docs/guide/practice_guide.html
+++ b/latest/docs/guide/practice_guide.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Practice Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Practice Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -324,7 +324,7 @@ <h2>GPU Practice Guide<a class="headerlink" href="#gpu-practice-guide" title="Li
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0e4550> 
+   <jinja2.runtime.BlockReference object at 0x7f124dae8430> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/python_api.html b/latest/docs/guide/python_api.html
index 09cfd42d6..f7f00b3fb 100644
--- a/latest/docs/guide/python_api.html
+++ b/latest/docs/guide/python_api.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Python APIs &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Python APIs &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -503,7 +503,7 @@ <h2>itex version<a class="headerlink" href="#itex-version" title="Link to this h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4ae00310> 
+   <jinja2.runtime.BlockReference object at 0x7f124da6c580> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/tf_serving_install.html b/latest/docs/guide/tf_serving_install.html
index 2c4229146..96a6c09fb 100644
--- a/latest/docs/guide/tf_serving_install.html
+++ b/latest/docs/guide/tf_serving_install.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Install TensorFlow Serving with Intel® Extension for TensorFlow* &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Install TensorFlow Serving with Intel® Extension for TensorFlow* &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -370,7 +370,7 @@ <h2>Run sample<a class="headerlink" href="#run-sample" title="Link to this headi
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92dab0> 
+   <jinja2.runtime.BlockReference object at 0x7f124d039c60> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/threadpool.html b/latest/docs/guide/threadpool.html
index 8b57cb475..41c292ebb 100644
--- a/latest/docs/guide/threadpool.html
+++ b/latest/docs/guide/threadpool.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Selecting Thread Pool in Intel® Extension for TensorFlow* CPU [Experimental] &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Selecting Thread Pool in Intel® Extension for TensorFlow* CPU [Experimental] &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -303,7 +303,7 @@ <h2>Example<a class="headerlink" href="#example" title="Link to this heading">
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a265120> 
+   <jinja2.runtime.BlockReference object at 0x7f124dbb6b60> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/guide/weight_prepack.html b/latest/docs/guide/weight_prepack.html
index d18cf0710..7aeabc023 100644
--- a/latest/docs/guide/weight_prepack.html
+++ b/latest/docs/guide/weight_prepack.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Online Weight Prepack &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Online Weight Prepack &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -166,7 +166,7 @@ <h2>Reference<a class="headerlink" href="#reference" title="Link to this heading
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92e8f0> 
+   <jinja2.runtime.BlockReference object at 0x7f124dbb7ac0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/experimental/install_for_arc_gpu.html b/latest/docs/install/experimental/install_for_arc_gpu.html
index a96a991d6..f9cc47a7a 100644
--- a/latest/docs/install/experimental/install_for_arc_gpu.html
+++ b/latest/docs/install/experimental/install_for_arc_gpu.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Experimental: Intel® Arc™ A-Series GPU Software Installation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Experimental: Intel® Arc™ A-Series GPU Software Installation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -188,7 +188,7 @@ <h5>Ubuntu Linux Installed in WSL2<a class="headerlink" href="#ubuntu-linux-inst
 <div class="highlight-bash notranslate"><div class="highlight"><pre><span></span>sudo<span class="w"> </span>apt-get<span class="w"> </span>install<span class="w"> </span>-y<span class="w"> </span>gpg-agent<span class="w"> </span>wget
 wget<span class="w"> </span>-qO<span class="w"> </span>-<span class="w"> </span>https://repositories.intel.com/gpu/intel-graphics.key<span class="w"> </span><span class="p">|</span><span class="w"> </span>
 sudo<span class="w"> </span>gpg<span class="w"> </span>--dearmor<span class="w"> </span>--output<span class="w"> </span>/usr/share/keyrings/intel-graphics.gpg
-<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sudo<span class="w"> </span>tee<span class="w"> </span>/etc/apt/sources.list.d/intel-gpu-jammy.list
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sudo<span class="w"> </span>tee<span class="w"> </span>/etc/apt/sources.list.d/intel-gpu-jammy.list
 sudo<span class="w"> </span>apt-get<span class="w"> </span>update
 </pre></div>
 </div>
@@ -245,7 +245,7 @@ <h4>Native Linux Running Directly on Hardware<a class="headerlink" href="#id2" t
 <div class="highlight-bash notranslate"><div class="highlight"><pre><span></span>sudo<span class="w"> </span>apt-get<span class="w"> </span>install<span class="w"> </span>-y<span class="w"> </span>gpg-agent<span class="w"> </span>wget
 wget<span class="w"> </span>-qO<span class="w"> </span>-<span class="w"> </span>https://repositories.intel.com/gpu/intel-graphics.key<span class="w"> </span><span class="p">|</span><span class="w"> </span>
 sudo<span class="w"> </span>gpg<span class="w"> </span>--dearmor<span class="w"> </span>--output<span class="w"> </span>/usr/share/keyrings/intel-graphics.gpg
-<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sudo<span class="w"> </span>tee<span class="w"> </span>/etc/apt/sources.list.d/intel-gpu-jammy.list
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sudo<span class="w"> </span>tee<span class="w"> </span>/etc/apt/sources.list.d/intel-gpu-jammy.list
 sudo<span class="w"> </span>apt-get<span class="w"> </span>update
 </pre></div>
 </div>
@@ -372,7 +372,7 @@ <h4>Setup environment variables<a class="headerlink" href="#setup-environment-va
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0e43a0> 
+   <jinja2.runtime.BlockReference object at 0x7f124d1da980> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/experimental/install_for_gpu_conda.html b/latest/docs/install/experimental/install_for_gpu_conda.html
index 0742b0c08..5f0d47130 100644
--- a/latest/docs/install/experimental/install_for_gpu_conda.html
+++ b/latest/docs/install/experimental/install_for_gpu_conda.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Conda Environment Installation Instructions &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Conda Environment Installation Instructions &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -193,7 +193,7 @@ <h2>Step by step instructions:<a class="headerlink" href="#step-by-step-instruct
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d2cb0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd78c40> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/how_to_build.html b/latest/docs/install/how_to_build.html
index f77318030..309adf8d9 100644
--- a/latest/docs/install/how_to_build.html
+++ b/latest/docs/install/how_to_build.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Overview &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Overview &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -519,7 +519,7 @@ <h2>Configure Example For XPU<a class="headerlink" href="#configure-example-for-
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a03fe80> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd8c5e0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/install_for_cpp.html b/latest/docs/install/install_for_cpp.html
index 2167ac655..c17f67b2e 100644
--- a/latest/docs/install/install_for_cpp.html
+++ b/latest/docs/install/install_for_cpp.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel® Extension for TensorFlow* for C++ &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel® Extension for TensorFlow* for C++ &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -537,7 +537,7 @@ <h3>Build and run<a class="headerlink" href="#build-and-run" title="Link to this
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a2668c0> 
+   <jinja2.runtime.BlockReference object at 0x7f124dbb6620> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/install_for_cpu.html b/latest/docs/install/install_for_cpu.html
index 87fda059c..aede6219d 100644
--- a/latest/docs/install/install_for_cpu.html
+++ b/latest/docs/install/install_for_cpu.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel CPU Software Installation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel CPU Software Installation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -220,7 +220,7 @@ <h4>Verify the Installation<a class="headerlink" href="#verify-the-installation"
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4c3e5c60> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd1db0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/install_for_xpu.html b/latest/docs/install/install_for_xpu.html
index 05a991896..9037cad14 100644
--- a/latest/docs/install/install_for_xpu.html
+++ b/latest/docs/install/install_for_xpu.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel XPU Software Installation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel XPU Software Installation &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -321,7 +321,7 @@ <h2>XPU for CPU only platform (Deprecated)<a class="headerlink" href="#xpu-for-c
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0e7670> 
+   <jinja2.runtime.BlockReference object at 0x7f124daeacb0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/docs/install/installation_guide.html b/latest/docs/install/installation_guide.html
index f2e694e3b..ff7970843 100644
--- a/latest/docs/install/installation_guide.html
+++ b/latest/docs/install/installation_guide.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Installation Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Installation Guide &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -133,7 +133,7 @@ <h1>Installation Guide<a class="headerlink" href="#installation-guide" title="Li
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a117cd0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd56740> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/README.html b/latest/examples/README.html
index dfa309bf7..d4793f36a 100644
--- a/latest/examples/README.html
+++ b/latest/examples/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Examples &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Examples &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../_static/custom.css?v=439db15d" />
@@ -205,7 +205,7 @@ <h2>Examples<a class="headerlink" href="#id1" title="Link to this heading"></
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a116b90> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd57a00> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/accelerate_alexnet_by_quantization/README.html b/latest/examples/accelerate_alexnet_by_quantization/README.html
index 47bb641e5..5693a35d6 100644
--- a/latest/examples/accelerate_alexnet_by_quantization/README.html
+++ b/latest/examples/accelerate_alexnet_by_quantization/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Accelerate AlexNet by Quantization with Intel® Extension for Tensorflow* &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Accelerate AlexNet by Quantization with Intel® Extension for Tensorflow* &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -170,7 +170,7 @@ <h2>Execute<a class="headerlink" href="#execute" title="Link to this heading">
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a03e1d0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd569e0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/common_guide_running.html b/latest/examples/common_guide_running.html
index b8d5e67cd..7d04b129d 100644
--- a/latest/examples/common_guide_running.html
+++ b/latest/examples/common_guide_running.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Common Guide for Running &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Common Guide for Running &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../_static/custom.css?v=439db15d" />
@@ -165,7 +165,7 @@ <h3>Run Script<a class="headerlink" href="#run-script" title="Link to this headi
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0e4490> 
+   <jinja2.runtime.BlockReference object at 0x7f124d1a6ec0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/infer_inception_v4_amp/README.html b/latest/examples/infer_inception_v4_amp/README.html
index 2b6747b8a..6e9b425e8 100644
--- a/latest/examples/infer_inception_v4_amp/README.html
+++ b/latest/examples/infer_inception_v4_amp/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -346,7 +346,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a7791b0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cef3ca0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/infer_resnet50/README.html b/latest/examples/infer_resnet50/README.html
index d8afa27cb..a77d650c0 100644
--- a/latest/examples/infer_resnet50/README.html
+++ b/latest/examples/infer_resnet50/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>ResNet50 Inference on Intel CPU and GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>ResNet50 Inference on Intel CPU and GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -165,7 +165,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92c580> 
+   <jinja2.runtime.BlockReference object at 0x7f124da6c8e0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/itex_quantization_example/README.html b/latest/examples/itex_quantization_example/README.html
index 3d15a7f4b..618061e1b 100644
--- a/latest/examples/itex_quantization_example/README.html
+++ b/latest/examples/itex_quantization_example/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel® Extension for Tensorflow* Model Quantization API Example &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel® Extension for Tensorflow* Model Quantization API Example &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -214,7 +214,7 @@ <h2>Run Model Quantization Example:<a class="headerlink" href="#run-model-quanti
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4c3e5690> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd0b80> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/model_zoo_example/README.html b/latest/examples/model_zoo_example/README.html
index af4782886..9e8f581f5 100644
--- a/latest/examples/model_zoo_example/README.html
+++ b/latest/examples/model_zoo_example/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -130,7 +130,7 @@ <h3>Run Models on Bare Metal<a class="headerlink" href="#run-models-on-bare-meta
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4c3e68f0> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd2ad0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/pretrain_bert/README.html b/latest/examples/pretrain_bert/README.html
index 29b6e979e..cc1e12257 100644
--- a/latest/examples/pretrain_bert/README.html
+++ b/latest/examples/pretrain_bert/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Accelerate BERT-Large Pretraining on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Accelerate BERT-Large Pretraining on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -527,7 +527,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a92ccd0> 
+   <jinja2.runtime.BlockReference object at 0x7f124d4d29e0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/quantize_inception_v3/README.html b/latest/examples/quantize_inception_v3/README.html
index 345564eff..ff4c58bef 100644
--- a/latest/examples/quantize_inception_v3/README.html
+++ b/latest/examples/quantize_inception_v3/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Quantize Inception V3 by Intel® Extension for Tensorflow* on Intel® Xeon® &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Quantize Inception V3 by Intel® Extension for Tensorflow* on Intel® Xeon® &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -237,7 +237,7 @@ <h2>License<a class="headerlink" href="#license" title="Link to this heading">
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0e40d0> 
+   <jinja2.runtime.BlockReference object at 0x7f124da261d0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/quick_example.html b/latest/examples/quick_example.html
index 0ed6e6372..ec8c99569 100644
--- a/latest/examples/quick_example.html
+++ b/latest/examples/quick_example.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Quick Example on Intel CPU and GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Quick Example on Intel CPU and GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../_static/custom.css?v=439db15d" />
@@ -196,7 +196,7 @@ <h2>Notes<a class="headerlink" href="#notes" title="Link to this heading"></a
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d3010> 
+   <jinja2.runtime.BlockReference object at 0x7f124daeb2b0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/stable_diffussion_inference/README.html b/latest/examples/stable_diffussion_inference/README.html
index bfa1d3854..2c0be71cc 100644
--- a/latest/examples/stable_diffussion_inference/README.html
+++ b/latest/examples/stable_diffussion_inference/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Stable Diffusion Inference for Text2Image on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Stable Diffusion Inference for Text2Image on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -225,7 +225,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a1151e0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd57490> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_3d_unet/README.html b/latest/examples/train_3d_unet/README.html
index 034739705..4ad0a3dff 100644
--- a/latest/examples/train_3d_unet/README.html
+++ b/latest/examples/train_3d_unet/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -229,7 +229,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a117ca0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd55090> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_bert/README.html b/latest/examples/train_bert/README.html
index dab3e4c8b..40e90bce4 100644
--- a/latest/examples/train_bert/README.html
+++ b/latest/examples/train_bert/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>BERT Training for Classifying Text on Intel CPU and GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>BERT Training for Classifying Text on Intel CPU and GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -208,7 +208,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a117670> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd56500> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_bert_fp8/README.html b/latest/examples/train_bert_fp8/README.html
index bc7d3964f..a3bc8f4f5 100644
--- a/latest/examples/train_bert_fp8/README.html
+++ b/latest/examples/train_bert_fp8/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -201,7 +201,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d14b0> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd78130> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_horovod/mnist/README.html b/latest/examples/train_horovod/mnist/README.html
index e68e55251..964b90f29 100644
--- a/latest/examples/train_horovod/mnist/README.html
+++ b/latest/examples/train_horovod/mnist/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Distributed Training Example with Intel® Optimization for Horovod* on Intel® GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Distributed Training Example with Intel® Optimization for Horovod* on Intel® GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -221,7 +221,7 @@ <h2>Output<a class="headerlink" href="#output" title="Link to this heading"><
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0e7550> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccb8d30> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_horovod/resnet50/README.html b/latest/examples/train_horovod/resnet50/README.html
index 76d9031b6..f8e2c5212 100644
--- a/latest/examples/train_horovod/resnet50/README.html
+++ b/latest/examples/train_horovod/resnet50/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Refer to train_resnet50 &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Refer to train_resnet50 &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../../_static/custom.css?v=439db15d" />
@@ -108,7 +108,7 @@ <h1>Refer to <a class="reference external" href="../../train_resnet50/README.htm
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4ae79150> 
+   <jinja2.runtime.BlockReference object at 0x7f124da6c1f0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_maskrcnn/README.html b/latest/examples/train_maskrcnn/README.html
index b9f950223..3e25168e7 100644
--- a/latest/examples/train_maskrcnn/README.html
+++ b/latest/examples/train_maskrcnn/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Accelerate Mask R-CNN Training on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Accelerate Mask R-CNN Training on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -234,7 +234,7 @@ <h2>FAQ<a class="headerlink" href="#faq" title="Link to this heading"></a></h
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4c3e7520> 
+   <jinja2.runtime.BlockReference object at 0x7f124d4d39d0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_resnet50/README.html b/latest/examples/train_resnet50/README.html
index 9c0ac2d7f..c6ad15506 100644
--- a/latest/examples/train_resnet50/README.html
+++ b/latest/examples/train_resnet50/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Resnet50 train on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Resnet50 train on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -252,7 +252,7 @@ <h2>Example Output with hvd<a class="headerlink" href="#example-output-with-hvd"
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0f5e70> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd3310> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/examples/train_resnet50_with_autoshard/README.html b/latest/examples/train_resnet50_with_autoshard/README.html
index 81938cde0..651b26ad0 100644
--- a/latest/examples/train_resnet50_with_autoshard/README.html
+++ b/latest/examples/train_resnet50_with_autoshard/README.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Accelerate ResNet50 Training by XPUAutoShard on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Accelerate ResNet50 Training by XPUAutoShard on Intel GPU &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="../../_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="../../_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="../../_static/custom.css?v=439db15d" />
@@ -278,7 +278,7 @@ <h2>Example Output<a class="headerlink" href="#example-output" title="Link to th
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0f6c80> 
+   <jinja2.runtime.BlockReference object at 0x7f124ccd3070> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/genindex.html b/latest/genindex.html
index 7bd920511..645fdd0c1 100644
--- a/latest/genindex.html
+++ b/latest/genindex.html
@@ -3,7 +3,7 @@
 <head>
   <meta charset="utf-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Index &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Index &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="_static/custom.css?v=439db15d" />
@@ -109,7 +109,7 @@ <h1 id="index">Index</h1>
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a3e7f10> 
+   <jinja2.runtime.BlockReference object at 0x7f124f02b580> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/get_started.html b/latest/get_started.html
index 79e77758b..794eedefc 100644
--- a/latest/get_started.html
+++ b/latest/get_started.html
@@ -4,7 +4,7 @@
   <meta charset="utf-8" /><meta name="viewport" content="width=device-width, initial-scale=1" />
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Intel® Extension for TensorFlow* &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Intel® Extension for TensorFlow* &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="_static/custom.css?v=439db15d" />
@@ -331,7 +331,7 @@ <h2>License<a class="headerlink" href="#license" title="Link to this heading">
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a114910> 
+   <jinja2.runtime.BlockReference object at 0x7f124cd557e0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/objects.inv b/latest/objects.inv
index 60ba67930..ceb808d2b 100644
Binary files a/latest/objects.inv and b/latest/objects.inv differ
diff --git a/latest/search.html b/latest/search.html
index 245bb07a8..ce93f1650 100644
--- a/latest/search.html
+++ b/latest/search.html
@@ -3,7 +3,7 @@
 <head>
   <meta charset="utf-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-  <title>Search &mdash; Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation</title>
+  <title>Search &mdash; Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation</title>
       <link rel="stylesheet" type="text/css" href="_static/pygments.css?v=fa44fd50" />
       <link rel="stylesheet" type="text/css" href="_static/css/theme.css?v=19f00094" />
       <link rel="stylesheet" type="text/css" href="_static/custom.css?v=439db15d" />
@@ -126,7 +126,7 @@
   Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
     <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
     provided by <a href="https://readthedocs.org">Read the Docs</a>.
-   <jinja2.runtime.BlockReference object at 0x7f4a4a0d8580> 
+   <jinja2.runtime.BlockReference object at 0x7f124c9c1ae0> 
   <p></p><div><a href='https://www.intel.com/content/www/us/en/privacy/intel-cookie-notice.html' data-cookie-notice='true'>Cookies</a> <a href='https://www.intel.com/content/www/us/en/privacy/intel-privacy-notice.html'>| Privacy</a></div>
 
 
diff --git a/latest/searchindex.js b/latest/searchindex.js
index 23a1359b2..937b65ca0 100644
--- a/latest/searchindex.js
+++ b/latest/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"alltitles": {"1.  Prerequisite": [[11, "prerequisite"]], "1. Build Intel\u00ae Extension for TensorFlow* C++ library": [[34, "build-intel-extension-for-tensorflow-c-library"]], "1. Correction": [[0, "correction"]], "1. Install GPU Drivers": [[37, "install-gpu-drivers"]], "2.  Define the op interface and Register op": [[11, "define-the-op-interface-and-register-op"]], "2. Build TensorFlow Serving": [[34, "build-tensorflow-serving"]], "2. Install TensorFlow* via PyPI Wheel in Linux": [[37, "install-tensorflow-via-pypi-wheel-in-linux"]], "2. Warning": [[0, "warning"]], "3.  Register the kernels for the op": [[11, "register-the-kernels-for-the-op"]], "3. Install Intel\u00ae Extension for TensorFlow*": [[37, "install-intel-extension-for-tensorflow"]], "3. Temporary Ban": [[0, "temporary-ban"]], "4.  Implement the kernels": [[11, "implement-the-kernels"]], "4. Permanent Ban": [[0, "permanent-ban"]], "4. Verify the Installation": [[37, "verify-the-installation"]], "6.  Add the op to BUILD": [[11, "add-the-op-to-build"]], "7. Use the op in Python": [[11, "use-the-op-in-python"]], "8. Build the package": [[11, "build-the-package"]], "9.  Install and Verify": [[11, "install-and-verify"]], "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU": [[55, "accelerate-3d-unet-training-w-o-horovod-for-medical-image-segmentation-on-intel-gpu"]], "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*": [[45, "accelerate-alexnet-by-quantization-with-intel-extension-for-tensorflow"]], "Accelerate BERT-Large Pretraining on Intel GPU": [[51, "accelerate-bert-large-pretraining-on-intel-gpu"]], "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU": [[50, "accelerate-deep-learning-training-and-inference-for-model-zoo-workloads-on-intel-gpu"]], "Accelerate Mask R-CNN Training on Intel GPU": [[60, "accelerate-mask-r-cnn-training-on-intel-gpu"]], "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU": [[62, "accelerate-resnet50-training-by-xpuautoshard-on-intel-gpu"]], "Accuracy": [[54, "accuracy"], [57, "accuracy"]], "AdamW": [[26, "adamw"]], "Additional": [[39, "additional"]], "Additional Performance Data for Intel AI Data Center Products": [[31, "additional-performance-data-for-intel-ai-data-center-products"]], "Advanced AMP vs. Stock TensorFlow AMP": [[19, "advanced-amp-vs-stock-tensorflow-amp"]], "Advanced Auto Mixed Precision": [[19, "advanced-auto-mixed-precision"], [19, "id1"]], "Advanced Auto Mixed Precision (AMP)": [[21, "advanced-auto-mixed-precision-amp"]], "Advanced Settings": [[29, "advanced-settings"]], "Advanced: Enable Advanced AMP Method": [[47, "advanced-enable-advanced-amp-method"]], "Apply Model Quantization": [[49, "apply-model-quantization"]], "Apply Patch": [[61, "apply-patch"]], "Apply Patch for Intel GPU": [[58, "apply-patch-for-intel-gpu"]], "Architecture": [[23, "architecture"]], "Attribution": [[0, "attribution"]], "Auto Mixed Precision Options": [[20, "auto-mixed-precision-options"]], "BERT Training for Classifying Text on Intel CPU and GPU": [[56, "bert-training-for-classifying-text-on-intel-cpu-and-gpu"]], "BERT-Large Phase2 Training Performance Results": [[31, "bert-large-phase2-training-performance-results"]], "BF16 + FP8 Fine-tuning": [[57, "bf16-fp8-fine-tuning"]], "Backend and Config Protocol": [[20, "backend-and-config-protocol"]], "Background": [[18, "background"], [45, "background"], [52, "background"]], "Basic Settings": [[29, "basic-settings"]], "Basic fusion": [[24, "basic-fusion"]], "Binaries Preparation": [[2, "binaries-preparation"]], "Build Docker container from Dockerfile": [[41, "build-docker-container-from-dockerfile"], [42, "build-docker-container-from-dockerfile"]], "Build Docker image from Dockerfile": [[34, "build-docker-image-from-dockerfile"]], "Build Intel\u00ae Extension for TensorFlow* CC library": [[40, "build-intel-extension-for-tensorflow-cc-library"]], "Build Intel\u00ae Extension for TensorFlow* PyPI": [[39, "build-intel-extension-for-tensorflow-pypi"]], "Build Source Code": [[39, "build-source-code"], [40, "build-source-code"]], "Build and run": [[40, "build-and-run"]], "Build from source": [[14, "build-from-source"], [34, "build-from-source"]], "Build the Docker Image": [[3, "build-the-docker-image"]], "Build to Local Test": [[5, "build-to-local-test"]], "Building the model": [[28, "building-the-model"]], "C++ coding style": [[7, "c-coding-style"]], "CPU": [[52, "cpu"]], "CPU Launcher [Experimental]": [[21, "cpu-launcher-experimental"]], "CPU Practice Guide": [[32, "cpu-practice-guide"]], "Check Currently Used Device Type": [[30, "check-currently-used-device-type"]], "Check Device Count (Optional)": [[58, "check-device-count-optional"]], "Check Intel\u00ae Advanced Matrix Extensions": [[52, "check-intel-advanced-matrix-extensions"]], "Check Intel\u00ae Deep Learning Boost": [[52, "check-intel-deep-learning-boost"]], "Check the Environment for XPU": [[42, "check-the-environment-for-xpu"]], "Clone Horovod Repo": [[58, "clone-horovod-repo"]], "Clone the Repository": [[47, "clone-the-repository"]], "Code": [[53, "code"]], "Code Structure": [[17, "code-structure"]], "Code style guide": [[7, "code-style-guide"]], "Command": [[61, "command"]], "Command with Horovod": [[61, "command-with-horovod"]], "Commands": [[51, "commands"]], "Common Execution Mode": [[29, "common-execution-mode"]], "Common Guide for Running": [[46, "common-guide-for-running"]], "Common Requirements": [[39, "common-requirements"], [40, "common-requirements"]], "Compatibility Table": [[63, "compatibility-table"]], "Conda Environment Installation Instructions": [[38, "conda-environment-installation-instructions"]], "Configuration": [[31, "configuration"], [52, "configuration"]], "Configuration List": [[18, "configuration-list"]], "Configuration via Environment Variables": [[20, "configuration-via-environment-variables"]], "Configure": [[39, "configure"], [40, "configure"]], "Configure Example For XPU": [[39, "configure-example-for-xpu"]], "Configure Example for CPU": [[39, "configure-example-for-cpu"]], "Configure For CPU": [[39, "configure-for-cpu"], [40, "configure-for-cpu"]], "Configure For GPU": [[40, "configure-for-gpu"]], "Configure For XPU": [[39, "configure-for-xpu"]], "Contributing": [[63, "contributing"]], "Contributing guidelines": [[7, "contributing-guidelines"]], "Contributing to Intel\u00ae Extension for TensorFlow*": [[7, "contributing-to-intel-extension-for-tensorflow"]], "Contributor Covenant Code of Conduct": [[0, "contributor-covenant-code-of-conduct"]], "Convergence": [[51, "convergence"]], "Create Release Version": [[5, "create-release-version"]], "Create Virtual Environment": [[58, "create-virtual-environment"]], "Create a Conda Environment": [[39, "create-a-conda-environment"], [40, "create-a-conda-environment"]], "Custom API": [[23, "custom-api"]], "Custom Operation": [[19, "custom-operation"]], "Customized Operators": [[25, "customized-operators"]], "Data Type": [[19, "data-type"]], "Default memory allocator": [[29, "default-memory-allocator"]], "Dense Layer": [[26, "dense-layer"]], "Dependency": [[58, "dependency"]], "Description": [[2, "description"], [3, "description"]], "Developing Intel\u00ae Extension for TensorFlow*": [[7, "developing-intel-extension-for-tensorflow"]], "Directory Tree Structure": [[9, "directory-tree-structure"]], "Disable Constant Folding Function": [[52, "disable-constant-folding-function"]], "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU": [[58, "distributed-training-example-with-intel-optimization-for-horovod-on-intel-gpu"]], "Documentation": [[4, "documentation"], [63, "documentation"]], "Documentation style guide": [[7, "documentation-style-guide"]], "Download Jupyter Code:": [[56, "download-jupyter-code"]], "Download Patch": [[58, "download-patch"]], "Download Source Code": [[39, "download-source-code"], [40, "download-source-code"]], "Download the Pretrained-model": [[47, "download-the-pretrained-model"]], "Dump the graph": [[17, "dump-the-graph"]], "Ease-of-use Python API": [[21, "ease-of-use-python-api"]], "EfficientNet-B0 Inference Performance Results": [[31, "efficientnet-b0-inference-performance-results"]], "EfficientNet-B3 Inference Performance Results": [[31, "efficientnet-b3-inference-performance-results"]], "Enable Advanced AMP": [[19, "enable-advanced-amp"]], "Enable Running Environment": [[47, "enable-running-environment"], [48, "enable-running-environment"], [51, "enable-running-environment"], [54, "enable-running-environment"], [55, "enable-running-environment"], [56, "enable-running-environment"], [57, "enable-running-environment"], [60, "enable-running-environment"], [61, "enable-running-environment"], [62, "enable-running-environment"]], "Enable Virtual Running Environment": [[46, "enable-virtual-running-environment"]], "Enable oneAPI": [[58, "enable-oneapi"]], "Enable oneAPI Running Environment": [[46, "enable-oneapi-running-environment"]], "Enable oneDNN Graph": [[52, "enable-onednn-graph"]], "End-to-end Example": [[18, "end-to-end-example"]], "Enforcement": [[0, "enforcement"]], "Enforcement Guidelines": [[0, "enforcement-guidelines"]], "Enforcement Responsibilities": [[0, "enforcement-responsibilities"]], "Environment Variable Configuration": [[47, "environment-variable-configuration"]], "Environment Variable Difference with Stock TensorFlow": [[18, "environment-variable-difference-with-stock-tensorflow"]], "Environment Variables": [[20, "environment-variables"], [29, "environment-variables"]], "Environment Variables with Python APIs": [[20, "environment-variables-with-python-apis"]], "Environment Vasriable": [[54, "environment-vasriable"]], "Example": [[16, "example"], [18, "example"], [19, "example"], [35, "example"], [40, "example"]], "Example Output": [[48, "example-output"], [53, "example-output"], [54, "example-output"], [62, "example-output"]], "Example Output with hvd": [[61, "example-output-with-hvd"]], "Example Output without hvd": [[61, "example-output-without-hvd"]], "Example of Mix Precision by List": [[18, "example-of-mix-precision-by-list"]], "Example:": [[22, "example"]], "Examples": [[17, "examples"], [29, "examples"], [44, "examples"], [44, "id1"]], "Execute": [[45, "execute"], [56, "execute"]], "Execute Testing and Comparing the Performance of FP32 and Advanced AMP on CPU and GPU in Docker Container or Bare Metal": [[47, "execute-testing-and-comparing-the-performance-of-fp32-and-advanced-amp-on-cpu-and-gpu-in-docker-container-or-bare-metal"]], "Execute the Example": [[51, "execute-the-example"], [55, "execute-the-example"], [57, "execute-the-example"], [60, "execute-the-example"]], "Executes the Example with Python API": [[48, "executes-the-example-with-python-api"], [54, "executes-the-example-with-python-api"], [62, "executes-the-example-with-python-api"]], "Executing Command": [[62, "executing-command"]], "Execution": [[58, "execution"], [61, "execution"]], "Experimental Release": [[37, "experimental-release"]], "Experimental: Intel\u00ae Arc\u2122 A-Series GPU Software Installation": [[37, "experimental-intel-arc-a-series-gpu-software-installation"]], "Extension Design": [[10, "extension-design"]], "Extra Requirements for XPU Build Only": [[39, "extra-requirements-for-xpu-build-only"]], "Extra Requirements for XPU/GPU Build Only": [[40, "extra-requirements-for-xpu-gpu-build-only"]], "FAQ": [[22, "faq"], [47, "faq"], [48, "faq"], [51, "faq"], [54, "faq"], [55, "faq"], [56, "faq"], [57, "faq"], [60, "faq"]], "FP16 Inference": [[54, "fp16-inference"]], "FP32 Inference": [[54, "fp32-inference"]], "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU": [[57, "fp8-bert-large-fine-tuning-for-classifying-text-on-intel-gpu"]], "Feature": [[19, "feature"]], "Features": [[21, "features"]], "Finetune Command": [[51, "finetune-command"]], "Frequently Asked Questions": [[14, "frequently-asked-questions"]], "Further Settings": [[62, "further-settings"]], "GNU OpenMP": [[32, "gnu-openmp"]], "GPU": [[45, "gpu"], [52, "gpu"]], "GPU Practice Guide": [[32, "gpu-practice-guide"]], "GPU Profiler": [[21, "gpu-profiler"], [22, "gpu-profiler"]], "Gelu Activation": [[26, "gelu-activation"]], "Generic layout optimizer": [[24, "generic-layout-optimizer"]], "Get docker container from dockerhub": [[41, "get-docker-container-from-dockerhub"], [42, "get-docker-container-from-dockerhub"]], "Graph Optimization": [[21, "graph-optimization"]], "Graph Optimizer": [[19, "graph-optimizer"]], "Graph fusion": [[24, "graph-fusion"]], "Hardware Configuration": [[31, "hardware-configuration"], [32, "hardware-configuration"]], "Hardware Configuration for Intel Flex 170 GPU": [[31, "hardware-configuration-for-intel-flex-170-gpu"]], "Hardware Configuration for Intel Max 1550 GPU": [[31, "hardware-configuration-for-intel-max-1550-gpu"]], "Hardware Environment": [[45, "hardware-environment"], [52, "hardware-environment"]], "Hardware Requirement": [[47, "hardware-requirement"], [63, "hardware-requirement"]], "Hardware Requirements": [[37, "hardware-requirements"], [39, "hardware-requirements"], [40, "hardware-requirements"], [41, "hardware-requirements"], [42, "hardware-requirements"], [51, "hardware-requirements"], [54, "hardware-requirements"], [55, "hardware-requirements"], [56, "hardware-requirements"], [57, "hardware-requirements"], [60, "hardware-requirements"], [61, "hardware-requirements"], [62, "hardware-requirements"]], "Highlights": [[4, "highlights"]], "How it works": [[16, "how-it-works"]], "How to identify different hardware types?": [[28, "how-to-identify-different-hardware-types"]], "How to write custom op": [[11, "how-to-write-custom-op"]], "I. Binaries Preparation": [[3, "i-binaries-preparation"]], "I. Customize Build Script": [[2, "i-customize-build-script"]], "I. Use all physical cores": [[29, "i-use-all-physical-cores"]], "II. Build the Container": [[2, "ii-build-the-container"], [3, "ii-build-the-container"]], "II. Use all cores including logical cores": [[29, "ii-use-all-cores-including-logical-cores"]], "III. Running the Container": [[2, "iii-running-the-container"]], "III. Use physical cores on one node": [[29, "iii-use-physical-cores-on-one-node"]], "INT8 Quantization": [[15, "int8-quantization"], [21, "int8-quantization"]], "ITEX_VERBOSE level definition": [[20, "itex-verbose-level-definition"]], "IV. Use your designated number of cores": [[29, "iv-use-your-designated-number-of-cores"]], "IX. Set environment variable TF_NUM_INTRAOP_THREADS": [[29, "ix-set-environment-variable-tf-num-intraop-threads"]], "If not use Horovod": [[61, "if-not-use-horovod"]], "If use Horovod": [[61, "if-use-horovod"]], "Implementation Details": [[24, "implementation-details"]], "Incompatible Changes": [[8, "incompatible-changes"]], "Inference Performance Results": [[31, "inference-performance-results"]], "Inference Performance on 1x Intel Data Center GPU Flex 170": [[31, "inference-performance-on-1x-intel-data-center-gpu-flex-170"]], "Inference Workloads": [[31, "inference-workloads"]], "Infrastructure": [[23, "infrastructure"]], "Install": [[58, "install"], [63, "install"]], "Install Bazel": [[39, "install-bazel"], [40, "install-bazel"]], "Install Clang-17 compiler": [[39, "install-clang-17-compiler"]], "Install GPU Drivers": [[42, "install-gpu-drivers"]], "Install Intel GPU Driver": [[39, "install-intel-gpu-driver"], [40, "install-intel-gpu-driver"]], "Install Intel\u00ae Extension for TensorFlow*": [[41, "install-intel-extension-for-tensorflow"], [42, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Extension for Tensorflow*": [[49, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Neural Compressor": [[49, "install-intel-neural-compressor"]], "Install Model Server": [[34, "install-model-server"]], "Install Other Required Packages": [[62, "install-other-required-packages"]], "Install TensorFlow": [[37, "install-tensorflow"], [39, "install-tensorflow"], [40, "install-tensorflow"], [41, "install-tensorflow"], [42, "install-tensorflow"]], "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*": [[34, "install-tensorflow-serving-with-intel-extension-for-tensorflow"]], "Install for CPU": [[63, "install-for-cpu"]], "Install for CPU weekly": [[63, "install-for-cpu-weekly"]], "Install for XPU": [[63, "install-for-xpu"]], "Install for XPU weekly": [[63, "install-for-xpu-weekly"]], "Install for weekly binaries": [[63, "install-for-weekly-binaries"]], "Install oneAPI Base Toolkit": [[39, "install-oneapi-base-toolkit"], [40, "install-oneapi-base-toolkit"]], "Install oneAPI Base Toolkit Packages": [[42, "install-oneapi-base-toolkit-packages"]], "Install using Docker": [[34, "install-using-docker"]], "Install via Docker container": [[41, "install-via-docker-container"], [42, "install-via-docker-container"]], "Install via PyPI wheel in bare metal": [[41, "install-via-pypi-wheel-in-bare-metal"], [42, "install-via-pypi-wheel-in-bare-metal"]], "Installation": [[53, "installation"]], "Installation Channel:": [[63, "installation-channel"]], "Installation Guide": [[43, "installation-guide"]], "Instance Normalization": [[26, "instance-normalization"]], "Integrate the CC library": [[40, "integrate-the-cc-library"]], "Intel Advanced Feature and Extension Management": [[23, "intel-advanced-feature-and-extension-management"]], "Intel CPU Software Installation": [[41, "intel-cpu-software-installation"]], "Intel GPU Driver": [[46, "intel-gpu-driver"]], "Intel OpenMP": [[32, "intel-openmp"]], "Intel XPU Software Installation": [[42, "intel-xpu-software-installation"]], "Intel\u00ae DevCloud": [[45, "intel-devcloud"], [52, "intel-devcloud"]], "Intel\u00ae Extension for TensorFlow*": [[63, "intel-extension-for-tensorflow"]], "Intel\u00ae Extension for TensorFlow* Config Protocol": [[33, "intel-extension-for-tensorflow-config-protocol"]], "Intel\u00ae Extension for TensorFlow* Docker Container Guide": [[2, "intel-extension-for-tensorflow-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide": [[3, "intel-extension-for-tensorflow-serving-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* for C++": [[40, "intel-extension-for-tensorflow-for-c"]], "Intel\u00ae Extension for Tensorflow* Model Quantization API Example": [[49, "intel-extension-for-tensorflow-model-quantization-api-example"]], "Intel\u00ae Extension for Tensorflow* Version": [[52, "intel-extension-for-tensorflow-version"]], "Intel\u00ae oneAPI Base Toolkit": [[46, "intel-oneapi-base-toolkit"]], "Introduction": [[5, "introduction"], [13, "introduction"], [23, "introduction"], [45, "introduction"], [47, "introduction"], [50, "introduction"], [51, "introduction"], [52, "introduction"], [54, "introduction"], [55, "introduction"], [56, "introduction"], [57, "introduction"], [60, "introduction"], [61, "introduction"], [62, "introduction"]], "Jemalloc": [[29, "jemalloc"]], "Keras 3 Overview": [[27, "keras-3-overview"]], "Keras Mixed Precision": [[28, "keras-mixed-precision"]], "Known Issues": [[8, "known-issues"]], "LSTM": [[26, "lstm"]], "Latency mode": [[29, "latency-mode"]], "Launch Log": [[29, "launch-log"]], "Launch Script User Guide": [[29, "launch-script-user-guide"]], "Layer Normalization": [[26, "layer-normalization"]], "License": [[52, "license"], [63, "license"]], "Limitation": [[36, "limitation"]], "Linker": [[40, "linker"]], "Load": [[40, "load"]], "Local Server": [[45, "local-server"], [52, "local-server"]], "Log and Save Optimized Graph": [[19, "log-and-save-optimized-graph"]], "Loss scaling": [[28, "loss-scaling"]], "Loss scaling overview": [[28, "loss-scaling-overview"]], "Mask-RCNN Inference Performance Results": [[31, "mask-rcnn-inference-performance-results"]], "Mask-RCNN Training Performance Results": [[31, "mask-rcnn-training-performance-results"]], "Medical Image 3D U-Net Training Performance Results": [[31, "medical-image-3d-u-net-training-performance-results"]], "Memory Allocator": [[29, "memory-allocator"], [32, "memory-allocator"]], "Memory Layout format": [[32, "memory-layout-format"]], "Mixed data type fusion": [[24, "mixed-data-type-fusion"]], "Model Code change": [[51, "model-code-change"], [54, "model-code-change"], [55, "model-code-change"], [57, "model-code-change"], [60, "model-code-change"], [61, "model-code-change"]], "Models": [[31, "models"]], "Multi-instance": [[29, "multi-instance"]], "Multi-tile with horovod": [[55, "multi-tile-with-horovod"]], "Multiple instances for inference": [[29, "multiple-instances-for-inference"]], "NUMA Control": [[29, "numa-control"]], "Native Linux Running Directly on Hardware": [[37, "native-linux-running-directly-on-hardware"], [37, "id2"]], "NextPluggableDevice Architecture": [[30, "nextpluggabledevice-architecture"]], "NextPluggableDevice Overview": [[30, "nextpluggabledevice-overview"]], "Non-Uniform Memory Access (NUMA)": [[32, "non-uniform-memory-access-numa"]], "Notes": [[53, "notes"]], "Notice": [[19, "notice"]], "Numactl": [[32, "numactl"]], "Numeric Stability": [[18, "numeric-stability"]], "OMP_NUM_THREADS": [[32, "omp-num-threads"]], "Objectives": [[16, "objectives"]], "Online Documentation Build Guide": [[5, "online-documentation-build-guide"]], "Online Weight Prepack": [[36, "online-weight-prepack"]], "OpenMP": [[32, "openmp"]], "OpenXLA": [[16, "openxla"]], "OpenXLA PJRT Plugin": [[30, "openxla-pjrt-plugin"]], "OpenXLA Support on GPU [Experimental]": [[21, "openxla-support-on-gpu-experimental"]], "Operator Optimization": [[21, "operator-optimization"]], "Operators Override": [[26, "operators-override"]], "Optimization in convolution": [[13, "optimization-in-convolution"]], "Optimizations Design": [[12, "optimizations-design"]], "Option 1: Extract from Tensorflow* python package (Recommended)": [[40, "option-1-extract-from-tensorflow-python-package-recommended"]], "Option 2: Build from TensorFlow* source code": [[40, "option-2-build-from-tensorflow-source-code"]], "Optional Requirements for CPU Build Only": [[39, "optional-requirements-for-cpu-build-only"]], "Optional: Install Full Intel\u00ae oneAPI": [[37, "optional-install-full-intel-oneapi"]], "Original Code": [[19, "original-code"]], "Our Pledge": [[0, "our-pledge"]], "Our Standards": [[0, "our-standards"]], "Output": [[58, "output"]], "Overview": [[15, "overview"], [16, "overview"], [17, "overview"], [19, "overview"], [20, "overview"], [28, "overview"], [29, "overview"], [31, "overview"], [32, "overview"], [33, "overview"], [36, "overview"], [39, "overview"], [49, "overview"]], "Performance Data": [[31, "performance-data"]], "Practice Guide": [[32, "practice-guide"]], "Preconditions": [[38, "preconditions"]], "Prepare": [[46, "prepare"]], "Prepare Dataset": [[49, "prepare-dataset"], [51, "prepare-dataset"], [55, "prepare-dataset"], [60, "prepare-dataset"]], "Prepare Example Code": [[58, "prepare-example-code"]], "Prepare ImageNet dataset": [[61, "prepare-imagenet-dataset"]], "Prepare Pre-Trained Model": [[49, "prepare-pre-trained-model"]], "Prepare Tensorflow* CC library and header files": [[40, "prepare-tensorflow-cc-library-and-header-files"]], "Prepare for GPU": [[51, "prepare-for-gpu"], [55, "prepare-for-gpu"], [57, "prepare-for-gpu"], [60, "prepare-for-gpu"], [62, "prepare-for-gpu"]], "Prepare for GPU (Skip this Step for CPU)": [[47, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for GPU (Skip this step for CPU)": [[48, "prepare-for-gpu-skip-this-step-for-cpu"], [54, "prepare-for-gpu-skip-this-step-for-cpu"], [56, "prepare-for-gpu-skip-this-step-for-cpu"], [61, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for Running": [[44, "prepare-for-running"]], "Prepare the Codes": [[62, "prepare-the-codes"]], "Prerequisite: import intel_extension_for_tensorflow as itex": [[33, "prerequisite-import-intel-extension-for-tensorflow-as-itex"]], "Prerequisites": [[48, "prerequisites"], [51, "prerequisites"], [51, "id1"], [51, "id2"], [54, "prerequisites"], [55, "prerequisites"], [56, "prerequisites"], [57, "prerequisites"], [60, "prerequisites"], [61, "prerequisites"], [62, "prerequisites"]], "Pretraining Command": [[51, "pretraining-command"]], "Python API": [[17, "python-api"], [18, "python-api"], [47, "python-api"], [62, "python-api"]], "Python API Attribute & Environment Variable": [[18, "python-api-attribute-environment-variable"]], "Python APIs": [[33, "python-apis"]], "Python APIs and Environment Variable Names": [[33, "python-apis-and-environment-variable-names"]], "Python APIs and preserved environment variable Names": [[33, "python-apis-and-preserved-environment-variable-names"]], "Python Unit Testing": [[7, "python-unit-testing"]], "Python coding style": [[7, "python-coding-style"]], "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae": [[52, "quantize-inception-v3-by-intel-extension-for-tensorflow-on-intel-xeon"]], "Quick Example on Intel CPU and GPU": [[53, "quick-example-on-intel-cpu-and-gpu"]], "Quick Start Guide": [[50, "quick-start-guide"]], "Quick Training Example": [[19, "quick-training-example"]], "Refer to train_resnet50": [[59, "refer-to-train-resnet50"]], "Reference": [[36, "reference"]], "References": [[16, "references"]], "Releases": [[8, "releases"]], "Report a Vulnerability": [[1, "report-a-vulnerability"]], "Requirements": [[39, "requirements"], [40, "requirements"]], "ResNet50 Inference on Intel CPU and GPU": [[48, "resnet50-inference-on-intel-cpu-and-gpu"]], "ResNet50v1-5 Inference Performance Results": [[31, "resnet50v1-5-inference-performance-results"]], "ResNet50v1-5 Training Performance Results": [[31, "resnet50v1-5-training-performance-results"]], "Resnet50 train on Intel GPU": [[61, "resnet50-train-on-intel-gpu"]], "Resources": [[10, "resources"], [63, "resources"]], "Result": [[47, "result"]], "Results": [[51, "results"]], "Rule to Improve Performance by the Configuration List": [[18, "rule-to-improve-performance-by-the-configuration-list"]], "Run Model Quantization Example:": [[49, "run-model-quantization-example"]], "Run Models in the Docker Container": [[50, "run-models-in-the-docker-container"]], "Run Models on Bare Metal": [[50, "run-models-on-bare-metal"]], "Run Script": [[46, "run-script"]], "Run sample": [[34, "run-sample"]], "Running": [[46, "running"]], "Running Command": [[58, "running-command"]], "Running Environment": [[45, "running-environment"], [52, "running-environment"]], "Running the Container": [[3, "running-the-container"]], "Running the Jupyter Notebook": [[54, "running-the-jupyter-notebook"]], "Runtime": [[14, "runtime"]], "Runtime Switch of NextPluggableDevice and PluggableDevice": [[30, "runtime-switch-of-nextpluggabledevice-and-pluggabledevice"]], "Scope": [[0, "scope"]], "Security": [[63, "security"]], "Security Policy": [[1, "security-policy"]], "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]": [[35, "selecting-thread-pool-in-intel-extension-for-tensorflow-cpu-experimental"]], "Set Model Parameters": [[61, "set-model-parameters"]], "Set Up Software Environment": [[49, "set-up-software-environment"]], "Set environment variables for inference": [[29, "set-environment-variables-for-inference"]], "Set up Base Running Environment": [[45, "set-up-base-running-environment"]], "Set up Intel\u00ae Extension for Tensorflow* for GPU": [[45, "set-up-intel-extension-for-tensorflow-for-gpu"]], "Setting the dtype policy": [[28, "setting-the-dtype-policy"]], "Setup": [[19, "setup"], [28, "setup"]], "Setup PYTHONPATH": [[62, "setup-pythonpath"]], "Setup Running Environment": [[46, "setup-running-environment"], [47, "setup-running-environment"], [48, "setup-running-environment"], [51, "setup-running-environment"], [54, "setup-running-environment"], [55, "setup-running-environment"], [56, "setup-running-environment"], [57, "setup-running-environment"], [58, "setup-running-environment"], [60, "setup-running-environment"], [61, "setup-running-environment"]], "Setup environment variables": [[37, "setup-environment-variables"], [42, "setup-environment-variables"]], "Sharding Parameters Setting": [[62, "sharding-parameters-setting"]], "Single Tile": [[55, "single-tile"]], "Single instance for inference": [[29, "single-instance-for-inference"]], "Situations leads to warning or Error": [[27, "situations-leads-to-warning-or-error"]], "Software Configuration": [[31, "software-configuration"], [32, "software-configuration"]], "Software Configuration for Intel Flex 170 GPU": [[31, "software-configuration-for-intel-flex-170-gpu"]], "Software Configuration for Intel Max 1550 GPU": [[31, "software-configuration-for-intel-max-1550-gpu"]], "Software Requirement": [[63, "software-requirement"]], "Software Requirements": [[37, "software-requirements"], [41, "software-requirements"], [42, "software-requirements"]], "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal": [[47, "speed-up-inference-of-inception-v4-by-advanced-automatic-mixed-precision-on-intel-cpu-and-gpu-via-docker-container-or-bare-metal"]], "Stable Diffusion Inference for Text2Image on Intel GPU": [[54, "stable-diffusion-inference-for-text2image-on-intel-gpu"]], "Stable Diffusion v1-4 Inference Performance Results": [[31, "stable-diffusion-v1-4-inference-performance-results"]], "Start with XLA using NextPluggableDevice": [[30, "start-with-xla-using-nextpluggabledevice"]], "Startup Jupyter Notebook": [[52, "startup-jupyter-notebook"], [56, "startup-jupyter-notebook"]], "Step": [[47, "step"]], "Step by step instructions:": [[38, "step-by-step-instructions"]], "Step-By-Step Instructions": [[37, "step-by-step-instructions"]], "Support": [[63, "support"]], "System environment install": [[37, "system-environment-install"], [41, "system-environment-install"], [42, "system-environment-install"]], "TCMalloc": [[29, "tcmalloc"], [32, "tcmalloc"]], "Table of Contents": [[32, "table-of-contents"]], "TensorFlow Public API": [[23, "tensorflow-public-api"]], "TensorFlow Serving": [[21, "tensorflow-serving"]], "Throughput mode": [[29, "throughput-mode"]], "Tips": [[19, "tips"]], "Tips and Debugging": [[7, "tips-and-debugging"]], "Training Accuracy Results": [[31, "training-accuracy-results"]], "Training Accuracy on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-accuracy-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Performance Results": [[31, "training-performance-results"]], "Training Performance on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-performance-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Workloads": [[31, "training-workloads"]], "Training the model with Model.fit": [[28, "training-the-model-with-model-fit"]], "Training the model with a custom training loop": [[28, "training-the-model-with-a-custom-training-loop"]], "Troubleshooting": [[14, "troubleshooting"]], "Tune Advanced AMP Manually": [[19, "tune-advanced-amp-manually"]], "Tune Advanced Auto Mixed Precision": [[18, "tune-advanced-auto-mixed-precision"]], "Tuning Performance Example on MobileNet": [[18, "tuning-performance-example-on-mobilenet"]], "Ubuntu Linux Installed in WSL2": [[37, "ubuntu-linux-installed-in-wsl2"]], "Underflow and Overflow": [[28, "underflow-and-overflow"]], "Unit testing": [[7, "unit-testing"]], "Update latest Version": [[5, "update-latest-version"]], "Usage": [[15, "usage"], [17, "usage"], [18, "usage"], [18, "id1"], [19, "usage"], [22, "usage"], [26, "usage"]], "Usage & Effect": [[36, "usage-effect"]], "Usage of Docker Container": [[2, "usage-of-docker-container"]], "Usage of TCMalloc/Jemalloc/Default memory allocator": [[29, "usage-of-tcmalloc-jemalloc-default-memory-allocator"]], "Use Case with different performance": [[27, "use-case-with-different-performance"]], "Using Eigen Thread Pool": [[35, "using-eigen-thread-pool"]], "Using OpenMP Thread Pool": [[35, "using-openmp-thread-pool"]], "V. Throughput mode": [[29, "v-throughput-mode"]], "VI. Latency mode": [[29, "vi-latency-mode"]], "VII. Your designated number of instances": [[29, "vii-your-designated-number-of-instances"]], "VIII. Your designated number of instances and instance index": [[29, "viii-your-designated-number-of-instances-and-instance-index"]], "Verify That Intel GPU is Accessible From TensorFlow": [[2, "verify-that-intel-gpu-is-accessible-from-tensorflow"]], "Verify the Installation": [[41, "verify-the-installation"], [42, "verify-the-installation"]], "Virtual environment install": [[37, "virtual-environment-install"], [41, "virtual-environment-install"], [42, "virtual-environment-install"]], "Welcome to Intel \u00ae Extension for TensorFlow* documentation!": [[6, "welcome-to-intel-extension-for-tensorflow-documentation"], [64, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Welcome to Intel\u00ae Extension for TensorFlow* documentation": [[4, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Why NextPluggableDevice": [[30, "why-nextpluggabledevice"]], "Windows GPU Drivers": [[37, "windows-gpu-drivers"]], "Windows Subsystem for Linux 2 (WSL2)": [[37, "windows-subsystem-for-linux-2-wsl2"], [37, "id1"]], "With XPUAutoShard": [[62, "with-xpuautoshard"]], "Without XPUAutoShard": [[62, "without-xpuautoshard"]], "Workflow": [[10, "workflow"], [15, "workflow"], [17, "workflow"], [36, "workflow"]], "X. Set environment variable TF_NUM_INTEROP_THREADS": [[29, "x-set-environment-variable-tf-num-interop-threads"]], "XPU Engine": [[23, "xpu-engine"]], "XPU for CPU only platform (Deprecated)": [[42, "xpu-for-cpu-only-platform-deprecated"]], "XPUAutoShard on GPU [Experimental]": [[17, "xpuautoshard-on-gpu-experimental"], [21, "xpuautoshard-on-gpu-experimental"]], "bazel style guide": [[7, "bazel-style-guide"]], "itex graph": [[33, "itex-graph"]], "itex operators": [[33, "itex-operators"]], "itex ops override": [[33, "itex-ops-override"]], "itex version": [[33, "itex-version"]], "itex.AutoMixedPrecisionOptions": [[33, "itex-automixedprecisionoptions"]], "itex.ConfigProto": [[33, "itex-configproto"]], "itex.DebugOptions": [[33, "itex-debugoptions"]], "itex.GPUOptions": [[33, "itex-gpuoptions"]], "itex.GraphOptions": [[33, "itex-graphoptions"]], "itex.ShardingConfig": [[33, "itex-shardingconfig"]], "itex.get_config": [[33, "itex-get-config"]], "itex.ops.AdamWithWeightDecayOptimizer": [[25, "itex-ops-adamwithweightdecayoptimizer"]], "itex.ops.GroupNormalization": [[25, "itex-ops-groupnormalization"]], "itex.ops.ItexLSTM": [[25, "itex-ops-itexlstm"]], "itex.ops.LAMBOptimizer": [[25, "itex-ops-lamboptimizer"]], "itex.ops.LayerNormalization": [[25, "itex-ops-layernormalization"]], "itex.ops.gelu": [[25, "itex-ops-gelu"]], "itex.set_config": [[33, "itex-set-config"]], "oneDNN object cache optimization": [[13, "onednn-object-cache-optimization"]], "quick_example.py": [[53, "quick-example-py"]]}, "docnames": ["CODE_OF_CONDUCT", "SECURITY", "docker/README", "docker/tensorflow-serving/README", "docs/README", "docs/build_docs/docs_build_tips", "docs/build_docs/source/index", "docs/community/contributing", "docs/community/releases", "docs/design/directory_structure", "docs/design/extension_design", "docs/design/how_to_write_custom_op", "docs/design/optimization/README", "docs/design/optimization/oneDNN_object_cache", "docs/guide/FAQ", "docs/guide/INT8_quantization", "docs/guide/OpenXLA", "docs/guide/XPUAutoShard", "docs/guide/aamp_tune", "docs/guide/advanced_auto_mixed_precision", "docs/guide/environment_variables", "docs/guide/features", "docs/guide/how_to_enable_profiler", "docs/guide/infrastructure", "docs/guide/itex_fusion", "docs/guide/itex_ops", "docs/guide/itex_ops_override", "docs/guide/keras3_support", "docs/guide/keras_mixed_precision", "docs/guide/launch", "docs/guide/next_pluggable_device", "docs/guide/performance", "docs/guide/practice_guide", "docs/guide/python_api", "docs/guide/tf_serving_install", "docs/guide/threadpool", "docs/guide/weight_prepack", "docs/install/experimental/install_for_arc_gpu", "docs/install/experimental/install_for_gpu_conda", "docs/install/how_to_build", "docs/install/install_for_cpp", "docs/install/install_for_cpu", "docs/install/install_for_xpu", "docs/install/installation_guide", "examples/README", "examples/accelerate_alexnet_by_quantization/README", "examples/common_guide_running", "examples/infer_inception_v4_amp/README", "examples/infer_resnet50/README", "examples/itex_quantization_example/README", "examples/model_zoo_example/README", "examples/pretrain_bert/README", "examples/quantize_inception_v3/README", "examples/quick_example", "examples/stable_diffussion_inference/README", "examples/train_3d_unet/README", "examples/train_bert/README", "examples/train_bert_fp8/README", "examples/train_horovod/mnist/README", "examples/train_horovod/resnet50/README", "examples/train_maskrcnn/README", "examples/train_resnet50/README", "examples/train_resnet50_with_autoshard/README", "get_started", "index"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["CODE_OF_CONDUCT.md", "SECURITY.md", "docker/README.md", "docker/tensorflow-serving/README.md", "docs/README.md", "docs/build_docs/docs_build_tips.md", "docs/build_docs/source/index.rst", "docs/community/contributing.md", "docs/community/releases.md", "docs/design/directory_structure.md", "docs/design/extension_design.md", "docs/design/how_to_write_custom_op.md", "docs/design/optimization/README.md", "docs/design/optimization/oneDNN_object_cache.md", "docs/guide/FAQ.md", "docs/guide/INT8_quantization.md", "docs/guide/OpenXLA.md", "docs/guide/XPUAutoShard.md", "docs/guide/aamp_tune.md", "docs/guide/advanced_auto_mixed_precision.md", "docs/guide/environment_variables.md", "docs/guide/features.rst", "docs/guide/how_to_enable_profiler.md", "docs/guide/infrastructure.md", "docs/guide/itex_fusion.md", "docs/guide/itex_ops.md", "docs/guide/itex_ops_override.md", "docs/guide/keras3_support.md", "docs/guide/keras_mixed_precision.md", "docs/guide/launch.md", "docs/guide/next_pluggable_device.md", "docs/guide/performance.md", "docs/guide/practice_guide.md", "docs/guide/python_api.md", "docs/guide/tf_serving_install.md", "docs/guide/threadpool.md", "docs/guide/weight_prepack.md", "docs/install/experimental/install_for_arc_gpu.md", "docs/install/experimental/install_for_gpu_conda.md", "docs/install/how_to_build.md", "docs/install/install_for_cpp.md", "docs/install/install_for_cpu.md", "docs/install/install_for_xpu.md", "docs/install/installation_guide.rst", "examples/README.md", "examples/accelerate_alexnet_by_quantization/README.md", "examples/common_guide_running.md", "examples/infer_inception_v4_amp/README.md", "examples/infer_resnet50/README.md", "examples/itex_quantization_example/README.md", "examples/model_zoo_example/README.md", "examples/pretrain_bert/README.md", "examples/quantize_inception_v3/README.md", "examples/quick_example.md", "examples/stable_diffussion_inference/README.md", "examples/train_3d_unet/README.md", "examples/train_bert/README.md", "examples/train_bert_fp8/README.md", "examples/train_horovod/mnist/README.md", "examples/train_horovod/resnet50/README.md", "examples/train_maskrcnn/README.md", "examples/train_resnet50/README.md", "examples/train_resnet50_with_autoshard/README.md", "get_started.md", "index.rst"], "indexentries": {}, "objects": {}, "objnames": {}, "objtypes": {}, "terms": {"": [0, 4, 5, 14, 16, 18, 20, 21, 28, 31, 32, 34, 35, 39, 40, 45, 47, 49, 51, 52, 54, 55, 56, 63], "0": [2, 3, 4, 5, 11, 14, 15, 16, 19, 20, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 48, 49, 51, 52, 53, 56, 57, 58, 60, 61, 62, 63], "00": [16, 31, 42, 49, 61], "000": 28, "000000e": 51, "0001": 49, "0005": 51, "000611": 51, "001": [25, 26], "00363725": 25, "004": 51, "00404969": 25, "004888": 51, "006297": 61, "006950": 58, "00x": 31, "01": [14, 16, 26, 31, 33, 49, 61], "0113076031208038": 47, "01837550401687622": 47, "02": [16, 26, 28, 31, 61], "025180": 62, "027671": 62, "03": [29, 31, 51, 61], "037595": 51, "04": [2, 16, 31, 34, 35, 37, 39, 41, 42, 49, 56], "05": [16, 29, 31, 58], "0527704": 53, "06": [14, 16, 25, 28, 51], "061277": 28, "061301": 28, "061306": 28, "063685": 28, "063851": 28, "063865": 28, "0656753": 53, "07": [14, 16, 25, 31, 42, 61, 62], "072701": 51, "072752": 51, "072779": 51, "072805": 51, "072829": 51, "072861": 51, "072884": 51, "072928": 51, "073072": 51, "073094": 51, "073121": 51, "073183": 51, "077278": 53, "08": [16, 29, 35, 61], "089": 29, "09": [16, 29, 61], "090": 29, "0f": 11, "1": [2, 4, 5, 14, 16, 18, 19, 20, 21, 22, 25, 26, 27, 28, 29, 30, 32, 33, 35, 36, 38, 39, 42, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "10": [2, 14, 16, 18, 19, 25, 28, 29, 35, 36, 37, 39, 40, 41, 49, 51, 52, 61, 62, 63], "100": [11, 28, 33, 39, 51], "1000": [31, 34, 55, 61], "10000": [19, 25, 28], "101": 37, "1024": [28, 31], "1024_a": 51, "1024gb": 31, "103148": 62, "105446": 51, "107809": 58, "10gbase": 31, "11": [16, 18, 29, 31, 37, 38, 39, 40, 42, 61, 63], "111": [28, 32], "112": 32, "114": [28, 58], "1146879196167": 54, "11490434": 28, "116": 14, "118": [28, 30], "118212": 53, "1193419": 53, "12": [7, 14, 16, 28, 29, 31, 42, 51, 54, 56, 58, 61, 62, 63], "1200": 61, "122": 33, "122414": 51, "122509": 51, "12278": 31, "127": [5, 34], "128": [16, 31, 47, 51, 57], "128gb": 31, "129": 29, "12_h": 51, "12e": 51, "13": [16, 40, 52, 58, 62, 63], "133": 49, "136": 29, "137": 29, "139660941027136": 61, "139898862851904": 61, "14": [28, 31, 34, 40, 49, 51, 56, 58, 61, 63], "140": [39, 40], "140348344015936": 62, "1403804": 53, "140612319840064": 61, "141": 11, "144": 29, "1445": 11, "145": [29, 61, 62], "1455178": 53, "15": [2, 7, 16, 29, 31, 35, 37, 38, 39, 40, 41, 42, 45, 51, 63], "150": 55, "15000": 25, "15031084974591766410": 2, "150400": 31, "150w": 31, "1550": 16, "156": 28, "15865526": 25, "158808": 25, "16": [18, 28, 29, 31, 33, 41, 47, 51, 61], "161625": 62, "163": 49, "163161": 58, "163517": 58, "163815": 62, "1657011814330": 18, "1657011815538": 18, "1658201": 53, "1666": 51, "1691980294577": 47, "16x64gb": 31, "17": [29, 40], "170": [39, 40, 42, 54, 57], "1704025": 53, "170intel": 47, "1729176": 53, "174": 56, "17448926295332318308": 2, "1762": 31, "1766": 31, "177216": 51, "178206": 61, "18": [16, 51, 58], "182": 31, "1846": 51, "185w": 31, "19": [29, 31, 37, 41, 42], "1900": 61, "190052": 51, "190136": 51, "190169": 51, "190193": 51, "190217": 51, "190249": 51, "190273": 51, "190343": 51, "190536": 51, "190559": 51, "190587": 51, "190668": 51, "191": 29, "192": [29, 51], "197306": 53, "198": 29, "1986": 28, "1997": 25, "1a": 40, "1ccb4fee": 38, "1e": [25, 26, 28], "1export": [18, 19], "1tb": 31, "1u": 28, "2": [2, 14, 15, 16, 17, 18, 19, 20, 24, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 57, 58, 60, 61, 62, 63], "20": [16, 29, 31, 35, 39, 41, 60, 62], "200": [25, 26, 51], "2000": [51, 61], "200m": 32, "2016": 25, "2017": [31, 60], "2018": 49, "20180905": 33, "2019": 55, "20200711": 49, "2021": 14, "2022": [28, 29, 33], "2023": [38, 42, 49, 51, 58], "20230123": 21, "2024": [14, 31, 37, 42], "206": 29, "207": 29, "21": [29, 31, 51], "210": 49, "2100": 61, "2134862": 53, "215": 29, "2155": 28, "216": 29, "217981": 42, "22": [2, 31, 34, 37, 39, 41, 42, 49, 51, 62], "2200": 61, "22355853": 48, "224": [22, 49], "22471978829632": 51, "224x224": 31, "227250": 51, "229": 29, "23": [29, 31, 42, 62], "2300": 61, "23092487755584": 51, "23450678511424": 51, "2350": 37, "24": [29, 31, 51, 58], "2400": 61, "241": 29, "2488174077578": 57, "24_h": 51, "24x": 31, "25": [31, 62], "250": 58, "250221": 53, "25294047594070435": 28, "254": 29, "255": [19, 28, 35], "256": [28, 31, 35, 51, 62], "26": 35, "2600": 51, "2607155": 53, "2636094": 53, "26531240344047546": 28, "266": 29, "268435456": 2, "269": 28, "27": [16, 29, 32, 62], "272": 30, "27642": 42, "277716": 61, "277811": 61, "278": 29, "28": [29, 31, 32, 38, 42, 49, 51], "280": 62, "29": [29, 31], "290": 29, "298973": 53, "299": 35, "2nd": 41, "2tb": 31, "2x": [31, 35], "2x256x10": 62, "3": [2, 4, 7, 16, 18, 20, 22, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 38, 39, 40, 41, 42, 45, 46, 49, 52, 53, 62], "30": [14, 16, 31, 35, 49, 51, 62], "3000765": 53, "3007": 31, "300x300": [31, 49], "302": 29, "303": 28, "305706": 53, "31": [29, 37], "312": [31, 51], "314010": 51, "314064": 51, "314090": 51, "314113": 51, "314135": 51, "314165": 51, "314197": 51, "314260": 51, "314455": 51, "314478": 51, "314505": 51, "314589": 51, "315": 29, "318963": 53, "32": [16, 18, 25, 26, 28, 29, 31, 33, 47, 51, 57, 61], "3200": 31, "3221133": 53, "3265": 31, "327": 29, "327398": 53, "328223477737884": 54, "33": 14, "3343554": 62, "3359": 28, "3359284": 62, "3364005982875824": 28, "339": 29, "3391027": 53, "34": 29, "3455": 28, "3461": 31, "35": [29, 31, 42], "350w": 31, "351": 29, "3549364": 53, "3555": 28, "3587": 31, "36": [29, 31, 35, 49], "364": 29, "3670": 28, "37": 16, "3753": 28, "376": 29, "3787665": 53, "38": [29, 31], "3804817": 53, "381424": 53, "384": 31, "3870": 31, "388": 29, "39": [29, 31], "3905785": 53, "3999124": 53, "3d": 44, "3dunet_itex": 55, "3dunet_itex_with_horovod": 55, "3e": [51, 57], "3f": 35, "3rd": [4, 21, 31, 41], "4": [14, 17, 18, 20, 24, 25, 28, 29, 30, 32, 35, 38, 51, 53, 58, 60, 62], "40": [14, 16, 29, 31, 42, 51], "400": [29, 61], "404": 29, "405": 29, "408512": 61, "4096": [19, 28], "40ghz": 31, "41": [16, 28], "41249612335034": 57, "413": 29, "416651": 62, "419072": 62, "42": 31, "42261": 53, "425": 29, "43": [16, 29, 31, 42], "435": 31, "438": 29, "44": [11, 16, 29], "4498": 28, "452": 29, "45x": 31, "461180928": 51, "465": 29, "47": [16, 29, 61], "4718971": 53, "479": 62, "479142": 53, "47eb": [37, 42], "48": [16, 29, 51, 61], "480": 29, "4800": 31, "481086": 53, "4818356": 53, "49": [29, 61], "4929404": 53, "494": 29, "4d": 25, "4th": [31, 41, 47], "5": [11, 18, 19, 20, 22, 25, 28, 30, 33, 35, 39, 40, 41, 51, 53, 57, 62], "50": [29, 31, 35], "5000": 31, "5063303": 53, "509": 29, "50ghz": 32, "51": [16, 29, 31, 51], "510076": 14, "51179520": 51, "512": [31, 51, 57], "5120": 62, "512x512": 31, "517385": 53, "52": [16, 28, 29, 51], "523": 31, "5294489860534668": 28, "53": [29, 31], "5300783": 53, "5333": 37, "54": 58, "5479512": 53, "549": 29, "55": [14, 16, 29, 31, 32, 35, 62], "550": 29, "555174": 61, "555221": 61, "5597944": 53, "56": [16, 29, 31, 32, 35], "57": 31, "5774": 51, "57x": 31, "58": 29, "586": 29, "59": [16, 29], "590331": 61, "594147": 62, "595": 51, "596": [37, 42, 51], "597": 51, "597360": 62, "598": 51, "5e": 51, "5th": 31, "6": [18, 26, 28, 30, 31, 33, 42, 49, 51], "60": [28, 29, 31, 35, 51], "600": [51, 61], "60000": [19, 28], "600w": 31, "601": 51, "602": 51, "6027272": 53, "602742": 61, "603262": 61, "604": [29, 51], "6047": 31, "605": 29, "606": 51, "607": 51, "6153628825864496": 47, "6240": 28, "63": [16, 29], "6336y": 31, "6342418": 53, "634554": 62, "64": [14, 16, 17, 19, 28, 29, 31, 35, 37, 39, 41, 42, 51, 56], "640x640": 49, "6416": 51, "6422923": 53, "6456823": 53, "6461415": 53, "6514435": 53, "65504": 28, "6628485": 53, "66fa74b6a2a0bb1e563ae8bce66496b118b95200": 54, "67": [16, 29, 31], "6761076": 53, "68": 29, "6867": 31, "69": 31, "692": 31, "6926193": 53, "693": 29, "694": 29, "69612": 49, "699": 31, "7": [18, 28, 29, 30, 31, 33, 49, 51, 54], "7090344": 53, "71": 29, "7112d33": 33, "718459": 53, "72": [29, 49], "7239000201225281": 28, "7296917": 53, "7297122": 53, "730m": 14, "736": 31, "74": 31, "7494": 28, "75": [29, 31], "7520": 28, "757": 29, "76": [25, 29, 31, 51], "768": 51, "768_a": 51, "772": 29, "773": 11, "7787259": 53, "784": [19, 28, 29, 35], "79": 29, "790128": 61, "790632": 62, "792936": 62, "795": 29, "7987": 28, "7f": 51, "8": [18, 25, 28, 29, 31, 33, 40, 41, 42, 49, 51, 52], "80": [29, 31], "800": 61, "803": [37, 42], "806": 29, "81": [31, 51, 54, 57], "810": 51, "817": 29, "8180m": 32, "8192": [19, 28], "81m": 28, "82574l": 31, "828": 29, "83": [29, 31, 32, 51], "839": 29, "83m": 28, "84": [29, 31, 32], "841192": 25, "8413447": 25, "8480": [31, 35], "84m": 28, "85": 35, "850": 29, "8500": [3, 34], "8501": 34, "8534": 28, "85485": 53, "8598063": 53, "85m": 28, "86": [16, 31], "8672705": 53, "867908472383153": 47, "87": [29, 31], "870": 31, "875052": 53, "8751": 28, "88": [29, 57], "8809638": 53, "8819": 28, "8863": 28, "8876": [37, 42], "888000e": 51, "8880196": 53, "8888": [41, 42, 47, 52, 54, 56], "88eb3cff2f03dad85035621d041e23a14345999": 55, "891": 29, "892": 29, "8941312": 53, "8972": 28, "89942324": 53, "8x16gb": 31, "9": [14, 18, 25, 26, 29, 30, 37, 38, 39, 41, 42, 45, 46, 56, 62], "9000": 5, "908": 29, "909": 29, "91": [29, 31], "911": 29, "9154005": 53, "9168000221252441": 28, "917546": 61, "917738": 61, "918": 31, "92": [29, 31], "924008369445801": 28, "9259825": 53, "9260886": 53, "9266936945121049176": 2, "928": 31, "92880015134813": 47, "92x": 31, "93": 31, "930": 29, "9349675": 53, "9373732": 53, "9377": 28, "9381000399589539": 28, "9381838": 53, "93901324": 53, "94": 16, "940695": 58, "9410": 28, "947": 29, "948": 29, "9486000537872314": 28, "949225": 53, "95": [29, 31], "951": 29, "9536000490188599": 28, "96": [29, 31, 40, 51], "9631021": 53, "9677248": 53, "968": 31, "96x": 31, "97": 16, "9702091": 53, "9746864": 53, "9755": 28, "98": 16, "9842": 31, "9873173": 53, "988714": 53, "99": 16, "9959502": 25, "9963627": 25, "999": [25, 26], "99998": 25, "A": [0, 5, 17, 18, 24, 28, 29, 32, 33, 34, 36, 42, 44, 47, 58], "And": [30, 37, 41, 42, 51], "As": [17, 24, 28, 29, 32], "At": [16, 17, 21, 45, 54], "Being": 0, "But": [27, 28], "By": [13, 20, 28, 29, 32, 52], "For": [0, 1, 2, 4, 7, 11, 14, 15, 18, 19, 20, 23, 25, 26, 28, 29, 31, 33, 34, 35, 37, 42, 47, 48, 49, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62], "If": [2, 3, 5, 20, 22, 25, 26, 27, 28, 29, 32, 33, 35, 37, 39, 40, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60], "In": [4, 11, 16, 18, 19, 27, 28, 29, 30, 32, 35, 36, 38, 45, 47, 49, 52, 53, 58, 62], "It": [4, 11, 14, 15, 16, 17, 18, 19, 20, 21, 28, 30, 32, 35, 36, 38, 39, 44, 51, 52, 55, 56, 60, 63], "NOT": [7, 14], "No": [0, 14, 19, 22, 35, 39, 47, 48, 51, 54, 55, 56, 57, 60], "Not": 20, "ON": [17, 31, 33, 47, 62], "Of": 51, "On": [28, 32, 37, 41, 42], "One": [29, 32], "That": [14, 32, 39, 40, 47], "The": [0, 2, 4, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 45, 47, 49, 51, 52, 55, 56, 57, 58, 60, 61, 62], "Their": 28, "Then": [3, 11, 22, 33, 41, 42, 52], "There": [21, 27, 36, 39, 45, 47, 52, 61], "These": [16, 24, 28, 29, 63], "To": [2, 3, 4, 7, 16, 18, 19, 24, 27, 28, 32, 36, 37, 39, 40, 41, 42, 45, 51, 52, 54, 55, 60], "With": [18, 19, 28, 29, 30, 45, 48, 53, 54], "_": [0, 11, 13, 14, 17, 18, 20, 22, 24, 27, 28, 29, 30, 32, 33, 34, 35, 37, 39, 40, 46, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61], "__del__": 56, "__init__": 35, "__main__": [29, 35], "__name__": 35, "__version__": [11, 33, 37, 39, 40, 41, 42, 63], "_gbs1_": 51, "_gbs2_": 51, "_pywrap_itex": 39, "_timestamp_inst": 29, "_timestamp_instance_n_cor": 29, "a100": 54, "a380": [39, 40], "a730m": [39, 40], "a930253": 33, "abl": 5, "about": [0, 7, 19, 32, 34, 35, 45, 51, 52, 58], "abov": [18, 19, 22, 28, 29, 32, 37, 47, 51, 52, 55, 56, 57, 58, 60, 62], "absolut": [29, 51], "abus": 0, "acceler": [4, 14, 16, 30, 31, 33, 44, 47, 52, 63], "accept": [0, 7, 17], "access": 37, "accmatmul": 24, "accord": [17, 18, 47, 56, 58, 61], "accordingli": 62, "account": 0, "accumul": 31, "accur": 36, "accuraci": [15, 18, 19, 25, 28, 44, 45, 52, 58, 61], "achiev": [18, 32], "acm": [39, 40], "across": [16, 20, 25], "act": [0, 21, 34], "action": [0, 5, 36], "activ": [11, 18, 19, 22, 25, 28, 32, 33, 37, 38, 39, 40, 41, 42, 46, 47, 48, 52, 53, 55, 56, 58, 60], "ad": [5, 13, 17, 18, 21, 23, 28, 39, 51, 62], "adam": 25, "adamw": 25, "adamwithweightdecayoptim": 26, "adapt": 0, "add": [3, 4, 5, 17, 18, 19, 24, 27, 32, 34, 37, 39, 40, 47, 54, 62], "add_weight": 35, "add_with_xla": 30, "addit": [8, 21, 23, 24, 32, 36, 40, 63], "addition": [18, 28], "addn": 24, "addon": [26, 58], "address": [0, 32, 37], "adher": 63, "adjust": [20, 25, 51], "adjusted_init_lr": 51, "adopt": [4, 15, 16, 21], "advanc": [0, 4, 20, 30, 33, 44, 63], "affect": [0, 18, 28], "affin": 32, "after": [2, 17, 18, 19, 22, 24, 26, 27, 28, 32, 33, 36, 37, 38, 42, 45, 51, 56], "afterward": [28, 29, 32], "ag": 0, "again": 28, "against": 7, "agent": 37, "aggress": [0, 16, 18, 19], "ahead": [39, 40], "ai": [44, 45, 50, 52, 63], "aim": 63, "aka": 21, "akdlm": [37, 42], "al": 25, "alexnet": 44, "alg": 11, "alg_kind_": 11, "algebra": [4, 16, 30], "algo": 11, "algorithm": [11, 25], "align": [0, 13], "all": [0, 7, 11, 14, 18, 20, 21, 25, 27, 28, 30, 32, 37, 42, 45, 47, 51, 62], "allocate_output": 11, "allow": [0, 16, 18, 28, 32, 35, 56, 63], "allowlist": 18, "allowlist_add": [18, 19], "allowlist_remov": 18, "almost": 21, "along": [30, 32], "alpha": 11, "alpha_": 11, "alreadi": [18, 28, 38, 45], "also": [0, 4, 7, 15, 16, 17, 19, 21, 23, 27, 28, 29, 30, 32, 36, 37, 38, 41, 42, 63], "altern": 18, "although": 32, "alwai": [18, 28, 36], "alwayslink": [11, 34], "am": 51, "among": [29, 32], "amount": [14, 28], "amp": [4, 18, 29, 31, 44, 55, 60, 63], "ampthre": 18, "amx": 52, "amx_bf16": 52, "amx_int8": 52, "an": [0, 2, 3, 4, 7, 11, 13, 14, 16, 18, 19, 21, 24, 25, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 40, 42, 44, 49, 52, 53, 57, 62, 63], "anaconda": 38, "analysi": [16, 32], "analyt": 45, "analyz": [16, 22], "ani": [0, 4, 11, 16, 20, 21, 23, 24, 27, 28, 29, 37, 38, 39, 42, 45, 53, 56], "annot": 17, "anoth": [29, 32, 36], "answer": 0, "antirectifi": 35, "aot": [39, 40], "apach": 63, "api": [4, 7, 9, 10, 14, 15, 16, 19, 25, 26, 27, 28, 30, 32, 34, 40, 52, 53], "apolog": 0, "apologi": 0, "appear": [0, 28], "append": [35, 37, 41, 42], "appli": [0, 16, 17, 25, 28, 33, 34, 51, 54, 55, 57, 60, 62], "applic": [4, 21, 23, 31, 32, 33, 34, 36, 45], "apply_gradi": 28, "appoint": 0, "approach": [4, 16, 38], "appropri": [0, 3, 32, 39, 40], "approv": 7, "approxim": [11, 25], "approximate_": 11, "apt": [7, 34, 37, 39, 42], "ar": [0, 2, 4, 5, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 36, 37, 39, 40, 41, 42, 44, 45, 47, 51, 52, 53, 55, 58, 61, 63], "arang": 25, "arc": [14, 39, 40, 42, 47, 63], "arch": 37, "architectur": [11, 16], "archiv": 37, "area": 13, "arg": [2, 13, 33], "argument": [13, 25, 28, 29, 33], "around": [0, 29, 51], "arrai": 25, "articl": 32, "as_graph_el": 35, "ask": [4, 36, 39, 40], "aspect": 28, "assign": [29, 32, 40], "assign_i": 40, "assign_x": 40, "assist": 8, "assum": [17, 28, 32, 38, 39, 40, 51, 55, 60], "assumpt": [2, 3], "astyp": [19, 28, 35, 53], "ats": [39, 40], "atsp": 28, "attach": [2, 3, 28, 32], "attack": 0, "attent": [0, 20], "attr": [11, 20], "attribut": [24, 33], "auto": [4, 11, 17, 27, 29, 30, 33, 40], "auto_mixed_precis": [18, 19, 33, 47], "auto_mixed_precision_log_path": [20, 33], "auto_mixed_precision_opt": [18, 19, 47], "auto_mixed_precision_optionsgraph_opt": 18, "auto_mod": [17, 62], "auto_sharding_pass": 17, "auto_sharding_pass_mlir": 17, "autom": [21, 29], "automat": [4, 5, 16, 17, 18, 19, 21, 26, 28, 29, 31, 32, 33, 37, 42, 44, 48, 53, 62], "automixedprecis": 18, "automixedprecisionopt": [18, 19, 47], "automixedprecosionopt": 18, "autoshard": [17, 62], "ava": 49, "avail": [0, 2, 3, 11, 14, 19, 25, 29, 32, 35, 36, 39, 40, 41, 42, 55], "averag": 51, "avgpool": [18, 19, 49], "avgpool3d": [18, 19], "avoid": [0, 4, 24, 27, 28, 29, 32, 35, 38, 51], "avx512": [4, 21, 52], "avx_vnni": 52, "awk": 51, "axi": [25, 26, 35], "b": [30, 35, 40, 47, 49, 51, 52, 61, 62], "b4ab4b8f8b3a41fade4899fd00b5b2d2dad0981f3e1bb10df4c522975fd7": 40, "b7a8": [37, 42], "ba": 25, "back": [17, 28, 39], "backend": [4, 16, 21, 23, 26, 27, 28, 33, 42, 47, 48, 52, 53, 63], "background": 32, "background_thread": 29, "backward": [11, 28], "balanc": [18, 19, 31, 35], "bare": 44, "base": [7, 11, 14, 15, 16, 18, 19, 25, 31, 32, 37, 38, 41, 44, 47, 51, 52, 57, 58, 62, 63], "base_config": 35, "base_shap": 35, "basekit": [37, 38, 42], "bash": [2, 37, 38, 39, 40, 47, 51, 52, 60, 63], "bashrc": 38, "basi": 37, "basic": [18, 19, 20, 28], "batch": [17, 25, 28, 29, 31, 51, 62], "batch_siz": [16, 17, 19, 28, 35, 55, 62], "batch_size_per_gpu": 51, "batchmatmul": [24, 26], "bazel": [3, 11, 34], "bazelbuild": [7, 39, 40], "bazelrc": 39, "becaus": [18, 19, 28, 36], "becom": [13, 32, 36], "been": [28, 32, 54, 62], "befor": [5, 7, 11, 16, 18, 19, 24, 27, 28, 29, 32, 35, 36, 39, 40, 44, 62], "begin": [7, 11, 47], "behavior": [0, 27, 28, 29, 32, 36, 51], "being": 32, "below": [2, 3, 24, 25, 28, 29, 30, 31, 32, 33, 37, 39, 42, 51, 56], "benchmark": [7, 16, 31, 35, 55, 61], "benefit": [4, 21, 28, 32, 33], "bert": [16, 20, 25, 36, 44], "bert_base_dir": 16, "bert_base_model": 16, "bert_config": [16, 57], "bert_config_fil": [16, 57], "bert_larg": 16, "bert_large_dir": 57, "bert_model": [51, 57], "bert_prep_working_dir": 51, "besid": [21, 32], "best": [0, 14, 16, 27, 37], "beta": 11, "beta_": 11, "beta_1": [25, 26], "beta_2": [25, 26], "beta_constraint": [25, 26], "beta_initi": [25, 26], "beta_regular": [25, 26], "better": [4, 15, 16, 18, 19, 21, 24, 25, 27, 29, 32, 35, 36, 44, 51, 52, 54, 55, 60], "between": [16, 17, 18, 19, 21, 32, 34, 35, 39, 54, 61, 62], "bf16": [18, 19, 24, 31, 44, 45, 47, 51, 55, 60, 61, 62], "bf32": 20, "bfloat16": [4, 11, 18, 19, 21, 24, 28, 33, 47, 51, 55, 57, 60], "bfloat16graph_opt": 19, "bia": [13, 20, 24, 53], "bias_add": 53, "bias_initi": [25, 26], "biasadd": [20, 26], "biasaddgrad": 24, "big": 45, "bin": [3, 7, 11, 29, 34, 39, 40, 46, 47, 48, 52, 55, 56, 58, 60], "bin_threadpool": 3, "binari": [18, 34, 39, 40], "bind": [13, 30, 32, 40], "bind_al": 22, "bit": [15, 18, 28, 33, 37, 39, 41, 42, 47], "blob": [21, 34], "block": [11, 32, 33, 35, 36, 42], "blocker": 45, "blocktim": 32, "blog": 16, "board": 31, "bodi": 0, "bookcorpu": [31, 51], "bool": 11, "boolean": [24, 29], "boost": [4, 21, 29, 31, 32], "both": [4, 7, 14, 15, 18, 19, 23, 27, 29, 30, 31, 32, 33, 39, 47, 61], "bound": 32, "box": 15, "brain": 55, "branch": [5, 7, 39], "break": 24, "bridg": [21, 34], "briefli": 32, "bring": [23, 28, 29, 63], "browser": [5, 22, 41, 42, 49, 52, 54, 56], "bs1": 49, "bt": 35, "bu": [2, 30], "buffer": [16, 49], "bug": [7, 63], "buid": 40, "build": [4, 7, 9, 35, 43, 44, 45, 51, 63], "build_doc": 5, "build_pip_packag": [11, 39], "build_tmp": 5, "build_with_threadpool": 40, "builder": 61, "buildifi": 7, "buildtool": 7, "built": [11, 16, 34, 41, 42], "bus_id": 2, "busi": 32, "bzl": 7, "c": [2, 4, 10, 11, 14, 29, 30, 32, 35, 37, 38, 39, 41, 42, 43, 56, 63], "c481324031ecf0f70f8939516c02e16cac60446d": 60, "c_api_experiment": 40, "c_str": 40, "cach": [12, 15, 32, 35, 51], "calcul": [29, 54], "calibr": 52, "call": [11, 15, 16, 26, 28, 30, 32, 33, 35, 36, 43, 46, 52, 53, 56, 57], "callabl": 56, "can": [2, 3, 4, 7, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 45, 51, 55, 56, 60, 61, 62, 63], "cannot": [14, 18, 27, 35, 47, 48, 51, 54, 55, 57, 60], "capabl": [4, 14, 27, 28], "capi": 30, "card": [20, 51, 58], "case": [4, 13, 18, 19, 21, 28, 29, 32, 35, 47], "cast": [0, 18, 24, 28, 49], "cat": 29, "catch": 11, "caus": [27, 28, 32, 35, 56], "cbica": 55, "cc": [3, 11, 14, 17, 28, 30, 34, 42, 58, 62], "ccl": [38, 42], "cd": [2, 5, 7, 16, 32, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 62], "cell": [28, 54], "center": [1, 4, 16, 21, 25, 26, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "cento": 41, "certain": [16, 29, 32], "challeng": 55, "chanc": [18, 28], "chang": [4, 5, 7, 11, 18, 19, 20, 21, 23, 27, 28, 29, 30, 36, 38, 44, 45, 56, 58], "channel": [0, 24, 25, 43], "channels_last": 62, "characterist": 0, "cheap": 35, "check": [5, 7, 11, 13, 14, 18, 19, 21, 23, 28, 29, 37, 38, 39, 40, 45, 46, 47, 57, 63], "checker": 32, "checkout": [5, 34, 40, 55, 60, 62], "checkpoint": 51, "choos": [16, 23, 25, 27, 28, 29, 32, 35, 39, 40, 43, 47, 49, 52, 53, 55], "chrome": 5, "circular": 27, "ckpt": [51, 57], "clang": 7, "clarifi": 0, "clariti": 0, "class": [0, 11, 28, 33, 35], "classic": 32, "classif": 22, "classifi": [44, 61], "classifier_train": 61, "classify_text_with_bert": 56, "claus": [4, 21, 23], "clean": [11, 40], "clearlist": 18, "clearlist_add": 18, "clearlist_remov": 18, "click": [11, 39, 40], "client": [2, 30, 40], "client_sess": 40, "clientsess": 40, "clock": 14, "clone": [5, 16, 34, 39, 40, 51, 54, 55, 57, 60, 61, 62], "close": [25, 27, 32], "closer": 24, "cluster": [27, 38], "cm": 37, "cmake": 39, "cnn": [18, 31, 32, 44, 45], "co": [4, 14, 15, 21], "coco": [31, 49, 60], "coco17": 49, "code": [2, 4, 5, 9, 11, 16, 20, 21, 22, 23, 27, 30, 31, 32, 34, 35, 43, 44, 45, 47, 49, 52], "codebas": [4, 30], "codenam": 4, "colab": 28, "collabor": [16, 63], "collect": [2, 32, 42], "color": 0, "com": [0, 5, 7, 8, 16, 21, 28, 32, 34, 35, 37, 38, 39, 40, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "combin": [16, 21, 29, 32, 54], "come": 4, "comma": 32, "command": [2, 3, 14, 22, 29, 32, 37, 38, 39, 40, 41, 42, 46, 47, 49, 52, 57], "comment": [0, 7, 14], "commit": [0, 5, 17, 34], "common": [0, 11, 14, 17, 21, 32, 44, 51], "common_runtim": [11, 30], "commonli": 32, "commun": [0, 2, 7, 9, 21, 23, 32, 42, 63], "compact": [29, 32, 35], "compar": [16, 18, 28, 32, 44], "compat": [2, 3, 4, 15, 19, 21, 23, 26, 28, 30, 33, 35, 51, 52, 54, 55, 56, 57, 60, 61], "compet": 32, "competit": 32, "compil": [4, 11, 14, 16, 19, 21, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 40, 42], "compiler_vers": 33, "complaint": 0, "complet": 32, "complic": [21, 29], "compon": [17, 19, 31, 33, 37, 38, 39, 40, 42], "compos": 17, "compressor": [4, 15, 21, 44, 45, 52], "comput": [4, 11, 15, 16, 25, 28, 32, 35, 37, 45, 53, 54, 63], "compute_dtyp": 28, "compute_gradi": 28, "concat": 35, "concaten": [35, 54], "concatv2": 49, "concept": [16, 28, 32], "concrete_funct": 35, "concurr": [4, 13, 20, 32, 35], "conda": [4, 14, 43, 51, 56], "conda_prefix": 29, "conduct": [7, 29], "conduit": [4, 30], "conf": 29, "config": [11, 14, 17, 18, 19, 28, 34, 35, 37, 39, 40, 42, 47, 52, 58, 61, 62], "config_fil": 61, "configproto": [17, 18, 19, 47, 52, 62], "configur": [4, 8, 11, 14, 17, 19, 21, 23, 28, 29, 33, 35, 37, 42, 49, 61, 63], "confirm": [29, 39, 40], "conflict": 35, "conform": 7, "connect": 32, "consecut": 32, "consequ": 0, "consid": [0, 18, 58], "consist": [7, 28], "consol": 42, "const": 40, "constant": [11, 15, 16, 25, 26, 28, 30], "constant_fold": 52, "constraint": 25, "construct": [0, 11, 17, 28], "constructor": 28, "consum": 51, "consumpt": [19, 21, 28, 47], "contact": 8, "contain": [5, 9, 15, 17, 27, 29, 32, 34, 43, 44, 55, 60, 63], "content": [5, 40, 42], "context": [11, 25, 32], "contigu": 32, "continu": [0, 14, 18, 27, 28], "contrast": 16, "contribut": [0, 4, 14, 21, 29, 39], "contributor": [7, 63], "control": [31, 32, 44, 52, 62], "conv": [17, 24, 53], "conv2d": [4, 21, 49, 53], "conv3d": 24, "convent": 7, "convers": [17, 18, 19, 24], "convert": [15, 16, 17, 18, 19, 28, 36, 45, 47, 49, 55, 61], "convert_to_tensor": 11, "convgradfilt": 24, "convolut": 32, "cooper": [4, 21, 44, 49, 52], "copi": [2, 3, 40], "copt": [11, 34], "copyright": 7, "core": [9, 11, 14, 17, 26, 28, 30, 31, 32, 35, 39, 40, 42, 52, 53, 58, 62], "core_id": 29, "core_list": 29, "correct": [28, 35, 39, 40], "correspond": [18, 29, 30, 36], "correspondli": 61, "cost": 15, "costli": 32, "could": [0, 18, 28, 33, 40, 45, 51, 52], "count": 14, "coupl": 32, "coven": [7, 63], "cover": [19, 21, 24, 29, 32], "cp": [3, 40, 51], "cp311": 40, "cpp": [3, 14, 17, 37], "cpplint": 7, "cpu": [2, 3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 28, 31, 33, 34, 36, 43, 44, 45, 49], "cpudevic": 11, "cpunodebind": 32, "crash": 56, "creat": [11, 18, 28, 29, 30, 33, 36, 38, 42, 46, 49, 52, 55, 60, 62], "create_datasets_from_start": 51, "creatednnlengin": 11, "creatednnlstream": 11, "creation": 13, "critic": 18, "cross": [29, 32], "ctl": 61, "ctx": 11, "cuda": 28, "cuda_diagnost": 28, "cuda_driv": 28, "cuinit": 28, "curl": 38, "current": [14, 17, 22, 33, 51, 55, 60, 62], "custom": [4, 7, 9, 16, 18, 21, 26, 27, 29, 33, 37, 42, 51], "custom_graph_optimizer_registri": 58, "cv": 54, "cvfh": 3, "d": [7, 35, 37, 39, 40, 61], "d50dnp1sbb": 31, "dai": 51, "danger": 18, "dashboard": 22, "data": [4, 15, 16, 17, 18, 21, 22, 25, 28, 33, 35, 39, 40, 42, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "data_dir": [16, 51, 55, 60, 61], "data_f32": 11, "data_format": [20, 62], "data_typ": [18, 19, 47], "dataset": [19, 28, 31, 35, 52, 58], "dataset_dir": [55, 60], "datatyp": [33, 40, 51, 55, 60], "dch": 37, "dcmake_build_typ": 39, "ddr4": 31, "ddr5": 31, "de6201297144": [37, 42], "dealloc": 32, "dearmor": 37, "deb": [37, 39], "debug": [11, 20, 22, 33], "debugalloc": 32, "decai": 25, "decayed_learning_rate_at_crossover_point": 51, "decid": 17, "decis": [0, 17], "declar": 11, "decoupl": [25, 30], "dedic": 7, "deem": 0, "deep": [15, 25, 27, 32, 36, 44, 63], "deeper": 23, "deeplearningexampl": [31, 51, 55, 60], "def": [28, 30, 35], "default": [4, 7, 13, 14, 15, 18, 19, 20, 21, 23, 27, 28, 30, 31, 32, 33, 35, 39, 40, 51, 52, 53, 60, 61, 62], "default_data_typ": [18, 33], "default_dataset": 49, "default_static_qconfig": 49, "defin": [4, 16, 28, 40], "definit": [7, 18, 23, 33], "deleg": 15, "deliv": [4, 19, 21, 27], "delta_tim": 35, "demand": [13, 63], "demo": 22, "demonstr": [0, 31, 44], "denali": 31, "deni": 18, "dens": [19, 20, 28, 35], "dense1": 28, "dense2": 28, "dense_1": [19, 28], "dense_2": [19, 28], "dense_logit": [19, 28], "denylist": 18, "denylist_add": 18, "denylist_remov": 18, "dep": [11, 34], "depend": [14, 16, 19, 29, 32, 36, 37, 39, 40, 42], "deploi": [21, 34], "deploy": [38, 41, 42], "deprec": 39, "depthwiseconv2dn": 49, "dequant": [49, 52], "derogatori": 0, "desc": [11, 13], "descibl": 11, "describ": [25, 28, 29, 32], "descript": [9, 13, 18, 29, 32, 33, 44, 56], "descriptor": 11, "design": [4, 7, 9, 21, 30, 34, 45], "desir": [18, 29], "destruct": 32, "detail": [2, 3, 11, 15, 16, 17, 18, 19, 21, 23, 25, 28, 32, 33, 36, 37, 39, 40, 42, 45, 47, 51, 63], "detect": [32, 49], "determin": [0, 11, 28, 32], "dev": [2, 3, 14, 22, 34, 39, 42, 47, 57], "develop": [4, 14, 16, 21, 30, 32, 37, 39, 40, 41, 42, 63], "deviat": 25, "devic": [2, 3, 4, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 28, 33, 34, 39, 40, 42, 47, 62, 63], "device_cpu": 11, "device_gpu": [11, 17, 62], "device_lib": 2, "device_num": [17, 62], "device_typ": [2, 14, 17, 39, 40, 58, 62], "diagram": 63, "dialect": [16, 17], "dict": 35, "did": [28, 32], "diff_undef": 11, "diffent": 27, "differ": [0, 2, 4, 13, 16, 20, 21, 23, 25, 29, 30, 32, 33, 35, 36, 43], "differenct": [39, 40], "differenti": 39, "difficult": 30, "diffus": [44, 63], "digit": [19, 28], "dim": 13, "dimens": 17, "dir": [2, 3, 7, 51, 55, 56, 57, 60], "directli": [11, 14, 17, 27, 28, 29, 32, 36, 42], "directori": [2, 3, 4, 5, 7, 14, 17, 29, 34, 37, 39, 40, 42, 47, 48, 49, 51, 54, 55, 57, 60], "diretcori": 40, "disabl": [0, 15, 19, 27, 29, 30, 32, 33], "disable_numactl": 29, "disable_taskset": 29, "disbal": 39, "discontinu": 14, "discuss": 7, "disk": [36, 49], "disparag": 0, "displai": [20, 49], "distanc": 54, "distinguish": [28, 30], "distribut": [2, 4, 8, 31, 32, 37, 38, 42, 43, 44, 51, 60, 61, 63], "distribution_strategi": 62, "divers": 0, "divid": [25, 28, 32], "divis": 28, "dl": 7, "dll": 51, "dllogger": [55, 60], "dllvm_enable_project": 39, "dnnl": [11, 13], "dnnl_arg_dst": 11, "dnnl_arg_scratchpad": 11, "dnnl_arg_src": 11, "do": [7, 14, 19, 27, 28, 29, 33, 36, 39, 52], "do_benchmark": 35, "do_lower_cas": 16, "do_predict": [16, 57], "do_train": [16, 57], "doc": [5, 9, 11, 39, 56], "doc_strid": 57, "docker": [9, 43, 44], "dockerfil": 2, "dockerhub": 63, "docs_build": 9, "docstr": 11, "document": [2, 3, 28, 31, 36, 38, 39, 40], "doe": [16, 24, 27, 28], "doesn": [5, 17, 18, 36, 56], "domin": 28, "don": [28, 49], "done": [7, 22, 28, 32, 35, 37], "doubl": 28, "download": [2, 8, 28, 32, 37, 42, 49, 51, 60, 61], "download_and_preprocess_coco": 60, "downstream": 18, "dpc": [21, 37, 38, 39, 40, 42], "dpcpp": [33, 37], "draft": 5, "dramat": 32, "dri": [2, 3, 34, 42, 47], "drive": 35, "driver": [2, 3, 14, 28, 31, 38, 45, 47, 52, 63], "drop": [18, 29, 35], "dropout": 35, "dst_mem": 11, "dst_tensor": 11, "dt_float": [20, 40], "dtype": [11, 19, 25, 26, 30, 35, 53, 62], "dtype_polici": 28, "due": [18, 27, 32, 35], "dummi": [31, 49, 61], "dummy_v2": 49, "dump": [20, 35], "duplic": 39, "dure": [0, 15, 16, 18, 19, 24, 28, 36, 38, 39, 40, 47], "dut3046": 28, "dynam": [13, 28, 32, 35, 36], "e": [0, 2, 3, 5, 11, 17, 28, 29, 34, 40, 60, 61], "each": [14, 25, 28, 29, 30, 31, 32, 62], "eager": [11, 25], "earli": 37, "easi": [16, 21, 30, 45], "easiest": 38, "easili": [16, 30, 31, 33], "ecc": 31, "echo": [37, 51], "econom": 0, "ecosystem": [16, 30, 63], "ed": 40, "edit": [0, 2], "edu": 55, "educ": 0, "effect": [18, 29, 32], "effici": [4, 16, 21, 30, 32, 34, 35, 51, 62, 63], "effort": 37, "egg": 60, "eigen": [4, 20], "either": [3, 19, 27, 49], "elaps": [32, 49], "elig": 11, "elimin": [16, 36], "els": [19, 28, 40, 61], "eltwis": 11, "eltwise_bas": 11, "eltwise_base_hdr": 11, "eltwise_forward": 11, "eltwise_gelu_erf": 11, "eltwise_gelu_tanh": 11, "eltwise_relu": 11, "eltwisebaseop": 11, "elu": 24, "email": 0, "emit": 16, "empathi": 0, "empir": 25, "en": 42, "enabl": [4, 13, 15, 16, 17, 18, 21, 22, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 40], "enable_checkpoint_and_export": 62, "enable_itex_amp": 29, "enable_itex_layout_opt": 29, "enable_jemalloc": 29, "enable_op_parallel": 29, "enable_tcmalloc": 29, "enable_tensorboard": 62, "enable_tf_profil": [4, 21, 22, 28], "enable_xla": 62, "encod": 20, "encompass": 16, "encount": 14, "end": [28, 35, 39, 40, 44, 45, 52], "engin": [11, 14], "enhanc": [4, 30], "ensur": [7, 29], "enter": [2, 3, 22, 38, 39, 40], "enterpris": [31, 42], "entir": 28, "entri": 17, "enum": 33, "env": [14, 34, 38, 39, 40, 42, 46, 51, 52, 54], "env_check": [37, 38, 42, 63], "env_itex": [46, 47, 52, 54, 55, 56, 58, 60], "env_itex_cpu": [48, 56], "env_nam": 46, "environ": [0, 2, 4, 11, 13, 15, 16, 19, 21, 22, 23, 27, 28, 30, 32, 34, 35, 43, 44, 63], "environment": [30, 40], "epoch": [18, 19, 28, 35, 51, 58, 60], "epoch_loss_avg": 28, "epsilon": [25, 26], "equal": [24, 27, 32], "equival": [4, 28], "error": [4, 7, 11, 14, 20, 25, 28, 34, 47, 48, 51, 54, 55, 56, 57, 60], "errors_impl": [14, 47, 48, 51, 54, 55, 57, 60], "especi": [13, 38], "estim": [36, 63], "et": 25, "etc": [21, 30, 37, 39], "ethernet": 31, "ethnic": 0, "eu": 14, "eval_batch_s": 51, "evalu": [19, 28, 35, 54, 57], "even": [28, 29, 32, 43, 51, 63], "event": 0, "everi": [18, 20, 54], "everyon": 0, "evo": 31, "evolv": 30, "exact": 31, "exact_match": [51, 57], "exactli": 30, "exampl": [0, 2, 4, 5, 7, 9, 11, 14, 15, 20, 21, 24, 25, 26, 28, 31, 32, 33, 34, 37, 38, 45, 47, 50, 52, 56, 63], "example_test": 40, "except": [30, 33, 42, 51], "excess": 30, "exclud": 7, "exclus": 29, "excutor": 27, "exec": [11, 13], "exec_mod": 55, "execut": [2, 5, 11, 13, 15, 16, 17, 18, 19, 20, 22, 25, 28, 31, 32, 36, 39, 44, 52, 53], "executor": 15, "exist": [19, 24, 26, 28, 29, 45], "exit": 34, "exp": 18, "expect": [18, 38, 52, 63], "experi": [0, 4, 21, 23, 32], "experiment": [4, 13, 14, 22, 33, 39, 40, 42], "experimental_compil": 30, "experimental_gelu": 16, "experimental_ops_overrid": [26, 33], "explain": 18, "explan": 0, "explicit": [0, 11, 28, 32], "explicitli": [28, 29, 33, 52], "export": [4, 7, 11, 15, 16, 17, 18, 19, 21, 22, 28, 29, 30, 32, 34, 37, 38, 40, 42, 46, 47, 51, 52, 54, 57, 61, 62, 63], "expos": [21, 22, 63], "expr": 51, "express": 0, "extend": [4, 14, 21, 23, 25, 30, 32, 33], "extens": [5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "extent": 31, "extern": [0, 14, 40], "extra": [18, 28, 36], "extract": 51, "f": [2, 35, 40, 63], "f0": 11, "f1": [51, 57], "f502f0715979ec73c571ca5676ba58431b916f5f58ee3333": 56, "facilit": [4, 30], "factor": [21, 29], "fail": [11, 28, 33, 36], "fair": 0, "fairli": 0, "fallback": 25, "fals": [7, 16, 17, 25, 27, 28, 29, 35, 51, 57, 62], "familiar": 11, "faq": 0, "far": 28, "fashion": [4, 21], "fast": 25, "faster": [18, 19, 25, 27, 28, 32, 35, 36, 47, 49], "fatal": 14, "fdc7a2bc": [37, 42], "featur": [4, 7, 8, 11, 13, 17, 25, 32, 36, 39, 44, 52, 62, 63], "feedback": [0, 7], "fetch": 40, "few": [28, 61], "fewer": 28, "fi": 61, "fi_provid": 38, "fid": 54, "field": [33, 39, 40], "fig": [16, 36], "figur": [16, 30, 32], "file": [2, 5, 7, 14, 17, 18, 22, 29, 34, 37, 42, 47, 48, 49, 51, 54, 55, 56, 57, 60, 61, 63], "filenam": 35, "fill": [39, 40], "filter": 7, "filter_height": 53, "filter_width": 53, "final": [17, 19, 28, 51], "final_carry_st": 25, "final_memory_st": 25, "find": [7, 11, 22, 31, 32, 34, 36], "fine": [28, 29, 31, 32, 35, 51], "finish": [28, 35, 39, 53, 56], "first": [17, 18, 19, 22, 24, 25, 27, 28, 29, 30, 32, 37, 38, 39, 41, 42, 51, 55, 60], "fit": [19, 32, 35], "fix": [7, 28, 37], "flag": [17, 30, 40, 60], "flex": [39, 40, 42, 45, 47, 50, 52, 54, 57, 63], "flexibl": [4, 30, 33, 35], "flexibli": 63, "float": [11, 18, 20, 28, 33, 40, 47], "float16": [4, 16, 18, 19, 21, 28, 33, 47], "float16graph_opt": [18, 19], "float32": [11, 19, 24, 25, 26, 28, 30, 35, 51, 53, 55, 60], "flow": [16, 28], "flower": 52, "focus": [0, 30], "fold": 15, "folder": [2, 3, 19, 34, 39, 40, 61], "follow": [0, 2, 3, 7, 15, 16, 17, 18, 22, 24, 27, 28, 29, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 45, 47, 48, 51, 53, 54, 55, 56, 57, 60, 61, 62, 63], "follw": 62, "footprint": 36, "forg": [14, 56], "fork": [32, 35], "format": [7, 9, 18, 24, 28, 33, 35, 36, 61], "forth": 63, "forward": [11, 28, 54], "forward_train": 11, "found": [7, 14, 28, 29, 32, 34, 36, 39, 51], "four": 18, "fp": 47, "fp16": [16, 18, 19, 31, 44, 47, 51], "fp32": [16, 18, 19, 20, 24, 31, 44, 45, 49, 51, 52, 60], "fpn": 49, "fraction": 16, "framework": [14, 16, 30, 35, 36, 37, 40, 47, 48, 50, 51, 54, 55, 57, 60], "free": [0, 21, 29], "frequenc": [14, 31], "frequent": [4, 36], "friendli": 32, "from": [0, 3, 5, 7, 11, 16, 17, 18, 19, 21, 22, 27, 28, 29, 30, 32, 33, 35, 36, 37, 39, 43, 44, 47, 49, 50, 51, 52, 55, 56, 63], "from_logit": 35, "from_model": 49, "from_tensor_slic": 28, "frontend": [4, 16, 21, 23], "frozen": 19, "fr\u00e9chet": 54, "full": [7, 39, 40, 42], "fulli": [4, 19, 21, 30, 35], "function": [5, 17, 20, 21, 23, 25, 26, 28, 30, 32, 33], "fundament": 16, "further": [4, 16, 21], "fuse": [4, 16, 18, 19, 21, 24, 26, 51], "fusedaccmatmul": 24, "fusedbatchnorm": 24, "fusedbatchnormgrad": 24, "fusedmatmul": 24, "fusion": [4, 9, 17, 18, 19, 21, 26, 33], "fwd_desc": 11, "fwd_pd": 11, "fwd_primit": 11, "fwd_primitive_arg": 11, "g": [5, 17, 28, 40, 56, 61], "g10": [39, 40], "g11": [39, 40], "gamma_constraint": [25, 26], "gamma_initi": [25, 26], "gamma_regular": [25, 26], "gate": 25, "gaussian": 25, "gb": 31, "gbs1": 51, "gbs2": 51, "gcc": [33, 39], "gd": 35, "gddr6": 31, "gelu": [11, 33], "gelu_erf": 24, "gelu_tanh": 24, "geluop": 11, "gen": 31, "gen9": 11, "gender": 0, "gener": [4, 5, 16, 20, 21, 23, 28, 29, 30, 31, 32, 34, 38, 39, 41, 47, 49, 52], "get": [2, 4, 7, 11, 13, 21, 28, 31, 32, 33, 34, 35, 37, 39, 40, 47, 48, 51, 54, 55, 57, 60, 63], "get_concrete_funct": 35, "get_config": 35, "get_scaled_loss": 28, "get_unscaled_gradi": 28, "get_weight": 28, "getattr": 11, "getsitepackag": [37, 38, 42, 63], "gh": 5, "ghz": 31, "gigabit": 31, "gin": 58, "git": [5, 11, 16, 33, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 61, 62], "git_vers": [33, 38], "github": [5, 7, 8, 16, 21, 32, 34, 39, 40, 45, 47, 51, 54, 55, 57, 58, 60, 61, 62, 63], "give": [0, 35], "given": [17, 25, 29, 55], "glibcxx": 14, "glibcxx_3": 14, "global": [17, 28, 33, 62], "glorot_uniform": [25, 26], "glue_dataset": 16, "glue_dir": 16, "go": [7, 40, 41, 42], "go1": 7, "golang": 7, "gold": 31, "gomp": 32, "gomp_cpu_affin": 32, "good": [4, 19, 21, 23, 32, 34, 36], "googl": [7, 14, 16, 21, 22, 34, 57], "google_pretrained_weight": 51, "googleapi": [28, 35, 47, 49, 56], "govern": 63, "governor": 31, "gperftool": 32, "gpg": [37, 39], "gpu": [3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 25, 27, 28, 33, 34, 38, 43, 44, 49, 63], "gpu_kernel": 11, "gpu_profil": 28, "gpudevic": 11, "gracefulli": 0, "grad": 28, "gradient": 28, "gradienttap": 28, "granular": [29, 32, 35], "graph": [4, 9, 10, 13, 15, 16, 18, 20, 23, 30, 35, 36, 44, 53, 62, 63], "graph_def": 35, "graph_opt": [17, 18, 19, 33, 47, 52, 62], "graph_pb2": 35, "graphdef": [17, 18, 35], "graphic": [37, 39, 40], "graphopt": [17, 18, 19, 47, 62], "grappler": [15, 17, 19, 58], "greater": [24, 32], "greaterequ": 24, "greatli": 28, "green": 15, "grep": 52, "group": [25, 32], "gt": [18, 33, 62], "guarante": 37, "guid": [4, 9, 11, 18, 21, 28, 31, 34, 37, 39, 40, 42, 44, 45, 52, 63], "guidelin": [1, 4, 16, 50, 63], "guidlin": 31, "gxx_linux": [14, 56], "gz": [7, 32, 49], "h": [7, 11, 14, 17, 34, 40], "ha": [2, 3, 4, 14, 18, 19, 20, 28, 30, 32, 36, 37, 40, 51, 62], "had": [28, 32], "half": [11, 28], "halv": 28, "hand": 16, "handl": [1, 13], "handwrit": [44, 45], "happen": [28, 36, 56], "harass": 0, "hard": [2, 54], "hardwar": [4, 16, 17, 19, 21, 23, 25, 29, 33, 35, 44], "harm": 0, "hasattr": [11, 33], "hasn": 54, "hat": 42, "have": [0, 18, 28, 32, 37, 38, 39, 42, 45, 49, 52], "hbm2e": 31, "hdr": [11, 34], "he": 25, "he_norm": 35, "header": 11, "headless": 60, "healthi": 0, "heap": 32, "help": [14, 19, 20, 21, 29, 32, 39, 40, 45, 52], "here": [8, 11, 14, 17, 18, 24, 27, 30, 35, 36, 39, 40, 49, 51, 54, 55, 60, 62], "heterogen": [17, 63], "heurist": 17, "high": [14, 16, 17, 28, 32, 63], "higher": [14, 15, 20, 28, 32], "highli": 28, "histori": [19, 28], "hlo": 16, "hochreit": 25, "hold": 32, "home": [7, 29, 37, 41, 42, 56], "homogen": 17, "hook": 17, "horovod": [2, 31, 37, 38, 42, 44, 51, 60], "horovodversionmismatcherror": 51, "host": [2, 3, 28, 39, 42, 47], "hour": 31, "how": [1, 5, 14, 17, 18, 27, 32, 34, 39, 40, 42, 44, 49, 58, 61, 63], "howev": [18, 21, 24, 28, 29, 30, 32, 54], "hpp": 11, "hs_to_tfg": 17, "hsp": 17, "html": [0, 5, 11, 39, 42], "html64": [7, 37], "http": [0, 2, 5, 7, 8, 16, 21, 22, 28, 32, 34, 35, 37, 38, 39, 40, 41, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "http_proxi": [2, 3], "https_proxi": [2, 3], "hub": 34, "hurt": 33, "hutter": 25, "hvd": 51, "hvd_configur": 61, "hvd_support": 61, "hyper": [29, 31, 32], "hyperparamet": 51, "hyphen": 32, "i": [0, 4, 5, 7, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "i0203": 61, "i0324": 62, "i0817": 61, "i1015": 51, "i1021": 51, "i1022": 51, "icd": [37, 42], "id": [2, 30, 34], "idea": 32, "ident": [0, 28], "identif": 28, "identifi": 39, "if_not_mobil": 34, "igc": 37, "ignor": [18, 28, 34], "ii": [18, 19, 33], "iii": [18, 19], "illustr": 32, "ilov": 25, "imag": [27, 28, 35, 41, 42, 44, 49, 54], "image_classif": [61, 62], "image_nam": [2, 3], "imagenet": 22, "imageri": 0, "img_arrays_for_acc": 54, "impact": [0, 5, 14, 18, 24, 32, 56], "implement": [4, 7, 10, 16, 17, 19, 21, 23, 25, 26, 30, 32, 35, 49, 51, 63], "import": [2, 7, 11, 14, 17, 18, 19, 22, 23, 25, 26, 27, 28, 30, 32, 35, 37, 38, 39, 40, 41, 42, 47, 49, 52, 53, 56, 63], "import_graph_def": 35, "imports_graph_def": 35, "improv": [15, 16, 19, 28, 32, 36, 39, 40, 49, 62], "inappropri": 0, "incarn": 2, "incept": [15, 18, 35, 44, 49, 54], "inceptionv4": 35, "inceptionv4_fp32_pretrained_model": [35, 47], "incid": 0, "includ": [0, 7, 13, 14, 16, 17, 18, 20, 23, 40, 42, 51, 52, 53, 63], "include_subdir": 7, "inclus": 0, "incorrect": 28, "increas": [18, 28, 52], "independ": [16, 25, 29, 35], "index": [18, 32], "indic": [24, 28, 47, 62], "individu": [0, 16, 20], "inf": 28, "infer": [11, 15, 16, 17, 18, 19, 24, 28, 34, 36, 44, 45, 51, 52, 56], "infer_config": 52, "infer_fp32_vs_amp": 47, "infer_inception_v4_amp": 47, "infer_resnet50": [29, 48], "inferlist": 18, "inferlist_add": 18, "inferlist_remov": [18, 19], "infin": 28, "influenc": [21, 29, 32], "info": [17, 18, 29, 36, 40, 45, 47, 49], "inform": [0, 1, 7, 8, 16, 20, 29, 32, 33, 39, 40, 42, 45, 52, 61, 63], "infrastructur": [4, 9, 20, 63], "init": 11, "init_checkpoint": 57, "initi": [17, 20, 28, 31, 35, 39, 40], "initial_weight": 28, "innov": [4, 63], "inplac": 7, "input": [4, 11, 13, 17, 19, 20, 21, 22, 24, 25, 28, 33, 35, 62], "input_height": 53, "input_shap": [35, 49], "input_width": 53, "input_x": 35, "insert": [18, 19, 24, 35, 52], "insid": [2, 63], "inspir": 0, "instal": [2, 3, 4, 7, 9, 14, 18, 19, 21, 22, 23, 26, 27, 28, 29, 31, 32, 33, 45, 46, 47, 48, 51, 52, 54, 55, 56, 57, 60], "install_head": 40, "instanc": [0, 31], "instance_idx": 29, "instancenorm": [19, 26], "instead": [36, 37, 39, 51, 54, 55, 60], "instruct": [2, 3, 4, 7, 16, 18, 19, 21, 31, 32, 41, 42, 54, 61, 63], "insult": 0, "int": [11, 35, 40, 51], "int8": [4, 28, 31, 45, 49, 52], "integ": 29, "integr": [4, 15, 16, 30, 32, 39], "intel": [0, 1, 5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 36, 38, 43, 44], "intel_extension_for_tensorflow": [11, 17, 18, 19, 25, 26, 28, 29, 34, 37, 38, 39, 41, 42, 47, 49, 63], "intel_extension_for_tensorflow_lib": [11, 39], "intel_xpu": 2, "intelai": 16, "intelpython3_ful": 38, "intend": [7, 16, 63], "intent": 7, "inter": [4, 20, 35], "inter_op_parallelism_thread": 35, "interact": [0, 39], "interfac": [17, 30, 43, 63], "intermedi": [16, 28], "intern": 16, "internet": 47, "interop": 29, "interpret": 29, "intraop": 29, "introduc": [16, 29, 32, 36], "introduct": 19, "invalid": [13, 27, 32], "invent": 15, "investig": [0, 29], "invis": 0, "invok": [16, 17], "involv": 0, "io": [5, 34], "ip": 56, "ipc": [2, 3, 42, 47], "ipp": 55, "ipykernel": 54, "ipynb": [52, 54, 56], "ipython": 56, "ir": [16, 17], "irc_na": [37, 42], "is_bf16_math_mod": 24, "is_gpu_avail": 28, "isol": [37, 41, 42], "issu": [0, 1, 4, 7, 14, 18, 28, 37, 39, 40, 42, 56, 63], "item": [22, 35], "iter": [20, 31, 35, 36, 62], "itex": [0, 2, 3, 4, 8, 9, 11, 13, 14, 17, 18, 19, 20, 21, 23, 26, 27, 28, 29, 30, 31, 34, 37, 38, 39, 40, 41, 42, 46, 47, 52, 54, 62, 63], "itex_auto_mixed_precis": [16, 18, 19, 29, 33, 47], "itex_auto_mixed_precision_allowlist_add": [18, 19], "itex_auto_mixed_precision_allowlist_remov": 18, "itex_auto_mixed_precision_clearlist_add": 18, "itex_auto_mixed_precision_clearlist_remov": 18, "itex_auto_mixed_precision_data_typ": [16, 18, 19, 47], "itex_auto_mixed_precision_denylist_add": 18, "itex_auto_mixed_precision_denylist_remov": 18, "itex_auto_mixed_precision_inferlist_add": 18, "itex_auto_mixed_precision_inferlist_remov": [18, 19], "itex_auto_mixed_precision_log_path": [18, 19, 20, 33], "itex_auto_mixed_precision_unsafe_force_al": 18, "itex_bf16": 61, "itex_bf16_lar": 61, "itex_build": [39, 40], "itex_cfg": [17, 62], "itex_check_eq": 11, "itex_cpp_min_log_level": 20, "itex_disable_xla": 27, "itex_dummy_bf16": 61, "itex_dummy_bf16_lar": 61, "itex_dummy_fp32": 61, "itex_dummy_fp32_lar": 61, "itex_enable_multiple_stream": 62, "itex_enable_nextpluggable_devic": 27, "itex_fp32": 61, "itex_fp32_lar": 61, "itex_fp32_math_mod": [20, 51], "itex_gpu_wrapp": 42, "itex_layout_opt": [29, 32, 33], "itex_layout_optitex_remapperitex_auto_mixed_precisionitex_shard": 33, "itex_omp_threadpool": [3, 4, 20, 29, 35, 40], "itex_onednn_graph": [33, 52], "itex_ops_overrid": 27, "itex_optimizer_after_shard": 17, "itex_optimizer_before_shard": 17, "itex_quant": 49, "itex_remapp": 33, "itex_repo": 47, "itex_shard": 33, "itex_sync_exec": 33, "itex_tf_constant_fold": [15, 52], "itex_tile_as_devic": 20, "itex_verbos": [11, 17], "itex_vlog": 11, "itex_xpu_librari": 11, "itex_xx": 61, "itexauto_mixed_precision_opt": [18, 19], "itexdatatyp": 33, "itexgelu": 26, "itexgelugrad": 26, "itexlayernorm": 26, "itexlayernormgrad": 26, "itexlstm": 26, "itexresourceapplyadamwithweightdecai": 26, "itexrnn": 26, "its": [4, 11, 25, 28, 29, 30, 32, 37, 42, 53], "iv": [18, 19], "jammi": [37, 39], "jax": [16, 27, 30, 63], "jemalloc": 32, "jit": [4, 16, 27, 30], "jit_compil": 27, "job": [11, 20, 40], "join": [22, 32, 35], "json": [16, 35, 57], "just": [0, 4], "k8": [3, 40], "kaim": 25, "kdstindex": 11, "keep": [28, 32], "keepdim": 35, "kei": [9, 17, 20, 36, 37, 39], "kept": [26, 28], "kera": [4, 19, 25, 26, 31, 35, 51, 52, 54, 58, 63], "keras_util": [61, 62], "kerascv": 31, "keraslay": 22, "kernel": [2, 3, 9, 10, 15, 20, 22, 23, 24, 25, 28, 30, 31, 35, 37, 39, 40, 41, 42, 51, 52, 54, 56, 63], "kernel_initi": [25, 26], "kernels_experiment": 34, "keyr": 37, "kind": [0, 4, 21, 53], "kitti": 49, "kmp": 32, "kmp_affin": [29, 32, 35], "kmp_blocktim": [29, 32, 35], "knob": 29, "know": [19, 28], "knowledg": [19, 32], "known": [16, 28, 56], "kwarg": [25, 26, 35], "l": [34, 35, 40], "l28": 34, "l2loss": 24, "l_basekit_p_2024": [37, 42], "label_shap": 49, "ladder": 0, "lake": [4, 21], "lamb": [25, 51], "lambda": 25, "languag": [0, 40], "language_model": 16, "languagemodel": 51, "laptop": 14, "lar": 61, "larg": [4, 16, 20, 25, 28, 32, 35, 36, 44], "larger": [31, 32, 35, 39, 40], "last": [28, 56], "latenc": [13, 35, 47, 54], "latency_mod": 29, "later": [32, 37, 41, 42], "latest": [8, 27, 31, 34, 38, 39, 40, 42, 63], "launch": [21, 42, 54], "launcher": [4, 29, 32], "layer": [2, 9, 16, 19, 25, 28, 35, 52], "layer_0": 20, "layernorm": [19, 24, 26], "layernormgrad": 26, "layout": [13, 29, 33, 36], "layout_opt": 33, "ld": 32, "ld_library_path": 40, "ld_preload": [29, 32], "lead": [0, 16, 18], "leader": 0, "leakyrelu": 24, "learn": [0, 14, 15, 16, 19, 21, 25, 27, 29, 32, 34, 36, 44, 45, 63], "learning_r": [25, 26, 57], "learning_rate_per_gpu": 51, "learning_rate_phase1": 51, "learning_rate_phase2": 51, "least": [28, 37, 38], "leav": 32, "legaci": [27, 30, 51, 54, 55, 56, 57, 60, 61, 62], "legal": 7, "len": 35, "length": [16, 31, 51], "less": [4, 18, 19, 21, 24, 28, 35, 47], "lessequ": 24, "let": [18, 28, 34, 35], "level": [0, 14, 16, 17, 23, 24, 28, 37], "level_zero": 14, "level_zero_util": 14, "leverag": [4, 16], "lib": [2, 14, 29, 39, 40, 56], "lib64": 29, "lib_path": 40, "libgomp": 32, "libiari": 42, "libigc1": 37, "libigdfcl1": 37, "libigdgmm12": 37, "libiomp": 32, "libiomp5": [32, 40], "libitex": 40, "libitex_common": 39, "libitex_cpu": 39, "libitex_cpu_cc": [34, 40], "libitex_gpu": 39, "libitex_gpu_cc": [34, 40], "libitex_gpu_xetla": 40, "libmkl_sycl": [14, 47, 48, 51, 54, 55, 57, 60], "libomp": 39, "librari": [2, 3, 11, 14, 16, 29, 32, 37, 39, 42, 55], "library_path": 40, "libtensorflow": 40, "libtensorflow_cc": 40, "libtensorflow_framework": 40, "like": [0, 2, 7, 17, 25, 28, 32, 33, 46, 47, 57, 58], "limit": [16, 17, 32, 63], "line": [7, 28, 32, 34, 47, 56, 62], "linear": [4, 16, 19, 21, 25, 28, 30], "linearli": 25, "link": [2, 31, 40, 52], "linkstat": 11, "linux": [2, 3, 7, 29, 31, 32, 38, 39, 40, 41, 42, 52], "list": [2, 7, 11, 16, 19, 24, 27, 28, 29, 30, 32, 35, 37, 39, 40], "list_local_devic": 2, "list_physical_devic": [14, 19, 28], "littl": 18, "live": 16, "ll": [20, 24], "lld": 39, "lldb": 39, "llga": [7, 33], "llvm": [16, 39], "llvm_openmp": 40, "ln": 40, "load": [11, 28, 34, 35, 42], "load_data": [19, 28, 35], "load_ops_librari": 11, "load_pb": 35, "load_ref_result": 54, "local": [2, 3, 7, 14, 19, 29, 31, 32, 34, 35, 39, 40, 41, 42, 49, 58], "localalloc": 29, "localhost": [5, 11, 20, 41, 42], "locat": [7, 8, 39, 40, 51, 54], "lock": 13, "log": [7, 11, 18, 20, 22, 28, 33, 35, 40, 42, 47, 48, 51, 54, 55, 56, 57, 58, 60, 62], "log_everi": [55, 60], "log_file_prefix": 29, "log_path": 29, "log_step": 62, "log_warmup_step": 60, "logdir": 22, "logic": 32, "logit": 35, "logpath": 22, "long": [25, 30], "look": [2, 24, 34, 39, 40], "loop": [54, 62], "loshch": 25, "loss": [15, 18, 19, 31, 35, 44, 45, 52, 58], "loss_object": 28, "loss_scal": 28, "lossscaleoptim": 28, "low": [4, 16, 18, 21, 23, 28, 45], "lower": [4, 15, 18, 19, 21, 35, 47], "lowpropos": 49, "lr": [25, 51, 58], "lscpu": [32, 52], "lstm": 25, "lt": [31, 33, 37], "ltensorflow_cc": 40, "ltensorflow_framework": 40, "m": [5, 29, 32, 45, 46, 49, 54, 55, 58, 60], "m150": [39, 40], "m75": [39, 40], "machin": [2, 3, 14, 16, 21, 28, 29, 32, 34, 41, 42, 53, 58], "macro": 11, "made": [11, 30, 55], "mai": [0, 7, 13, 14, 16, 18, 19, 24, 28, 29, 32, 35, 36, 37, 38, 42, 54, 63], "mail": 0, "main": [5, 17, 21, 37, 39, 40, 55, 58, 60, 61], "mainli": [15, 17, 29], "maintain": [0, 7, 8, 14, 18, 21, 23, 25, 34, 36], "make": [0, 2, 3, 5, 7, 11, 16, 18, 19, 28, 30, 32, 35, 36, 39, 40, 47], "makefil": 40, "malloc": [29, 32], "malloc_conf": 29, "man": 32, "manag": 63, "mani": [16, 18, 21, 28, 29, 32, 58], "manner": 16, "manual": [5, 7, 18, 28, 29, 51, 61], "manylinux2014": [37, 41, 42], "manylinux2014_x86_64": 40, "manylinux_2_17_x86_64": 40, "map_structur": 35, "mark": 17, "mask": [25, 44], "maskrcnn": 60, "master": [32, 34, 36], "match": [16, 29, 36, 43], "matcher": 24, "math": [20, 24, 28, 37, 42], "matmul": [17, 20, 24, 26, 35, 36, 40, 49], "matrix": [36, 40], "max": [16, 33, 39, 40, 42, 47, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62, 63], "max_seq_length": 57, "max_step": 55, "maxim": [4, 17, 21, 25, 33, 62], "maximum": [31, 51], "maxpool": 49, "maxpool3d": 24, "maxval": 35, "md": 21, "mean": [13, 14, 18, 25, 27, 28, 29, 32, 35, 36, 39, 40], "mechan": [4, 16, 21, 30], "media": 0, "medic": 44, "meet": [3, 25, 51, 63], "member": [0, 33], "membind": 32, "memori": [4, 9, 11, 13, 14, 15, 16, 18, 19, 21, 25, 28, 31, 36, 47, 51], "memory_limit": 2, "mention": [28, 32], "merg": 5, "messag": [28, 29], "meta": 13, "metadata_thp": 29, "metal": 44, "method": [28, 32, 45, 52], "metric": [19, 28, 35], "middl": 28, "might": [11, 39], "migrat": 7, "millisecond": 32, "mind": 16, "miniconda": 38, "miniconda3": 38, "minim": [15, 32], "minimum": [31, 39], "minor": [4, 21, 23], "minut": [25, 39, 40], "minval": 35, "miscellan": 9, "mismatch": 28, "miss": 15, "mistak": 0, "mit": 52, "mix": [4, 31, 33, 35, 44, 49], "mixed_bfloat16": 28, "mixed_float16": 28, "mixed_precis": 28, "mkdir": [2, 3, 39, 61, 62], "mkl": [7, 34, 37, 38, 39, 40, 42], "ml": 16, "mlir": 17, "mnist": [19, 28, 34, 35, 44, 58], "mnist_client": 34, "mnist_saved_model": 34, "mode": [16, 17, 20, 24, 31, 33, 39, 51, 54, 61], "model": [2, 3, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 27, 32, 33, 35, 36, 44, 45, 52, 56, 58, 62, 63], "model_base_path": 34, "model_dir": [3, 34, 55, 60, 61, 62], "model_nam": [3, 34], "model_path": 49, "model_serv": [3, 34], "model_training_util": 51, "model_typ": 61, "modelserv": 34, "moder": 0, "modern": 36, "modif": [4, 16, 30], "modifi": [5, 35, 40, 47, 51, 62], "modul": [14, 17, 29], "modular": 10, "modulenotfounderror": 14, "monitor": 14, "monolith": 16, "more": [1, 4, 7, 11, 16, 18, 19, 21, 25, 32, 34, 35, 36, 37, 39, 40, 42, 45, 51, 52, 53, 58, 61], "most": [4, 18, 19, 28, 29, 32, 47, 56], "mount": [2, 3], "move": [18, 32, 51, 55, 60], "mozilla": 0, "mpi": [37, 38, 42], "mpirun": [55, 58, 60, 61], "mrpc": 16, "mt": 31, "much": [28, 32, 35, 52], "mul": 24, "multi": [28, 32, 33, 38, 39, 51, 60, 62], "multipl": [18, 20, 32, 36, 62], "multipli": 28, "must": [5, 15, 27, 28, 35], "mutex": 13, "mutual": 29, "my": [14, 18, 19], "mybuilddir": 39, "myfil": 7, "n": [18, 24, 25, 32, 33, 38, 39, 40, 51, 53], "n02123159": 48, "na": [27, 31], "name": [2, 3, 5, 7, 11, 14, 18, 19, 20, 25, 26, 28, 30, 32, 34, 35, 44, 49, 54, 58], "name_scop": 11, "namespac": [4, 17, 21, 23, 25, 26, 33, 40], "nan": 28, "narrow": 28, "nation": 0, "nativ": [4, 15, 16, 21], "natur": 0, "ncdhw": 24, "nchw": 32, "ncore_per_inst": 29, "ndhwc": 24, "necessari": [16, 28, 37, 41, 42, 53], "necessarili": 16, "need": [4, 8, 13, 14, 16, 17, 20, 21, 23, 28, 29, 30, 34, 35, 36, 37, 38, 39, 40, 42, 47, 52, 53, 56, 60, 61, 62], "neg": [32, 35], "neglig": 28, "neither": 29, "nest": 35, "netron": 18, "network": [14, 15, 32], "neural": [4, 14, 15, 21, 32, 44, 45, 52], "new": [4, 5, 7, 8, 15, 16, 21, 23, 24, 28, 30, 32, 36, 45, 51], "newer": [15, 45, 46, 52], "newrootscop": 40, "next": [4, 16, 28, 39, 49], "next_pluggable_devic": 30, "next_pluggable_device_factori": 30, "nextplugg": 30, "nextpluggabledevic": 16, "nhwc": [20, 32], "nibabel": 55, "nic": 31, "nice": 32, "nifti": 55, "nightli": 55, "ninstanc": 29, "nn": [11, 25, 26, 33, 35, 53], "nn_op": 11, "no_proxi": [2, 3], "no_python": 29, "node": [13, 18, 20, 24, 32, 36, 38, 45, 51], "node0": 32, "node1": 32, "node_id": 29, "nolint": 7, "nolintnextlin": 7, "non": [27, 35], "none": [8, 25, 26, 28, 29, 33, 51], "nonetyp": 56, "nonlinear": 25, "nor": 29, "norm": 25, "normal": [17, 20, 25, 28, 32, 39, 47], "note": [2, 3, 5, 11, 16, 17, 18, 20, 25, 27, 28, 29, 31, 33, 34, 36, 39, 40, 47, 49, 51, 54, 58, 60, 61], "notequ": 24, "notfounderror": [14, 47, 48, 51, 54, 55, 57, 60], "noth": 11, "notic": [13, 28], "novel": 16, "now": [2, 18, 28, 32, 34], "np": [22, 25, 53, 55, 58, 60, 61], "npd": [4, 27, 30], "npz": 28, "nth": 32, "nullptr": 11, "num": [29, 32, 51], "num_accumulation_steps_phase1": 51, "num_accumulation_steps_phase2": 51, "num_channel": 53, "num_class": 35, "num_el": 11, "num_gpu": [51, 62], "num_test": 34, "num_train_epoch": 57, "num_unit": [19, 28], "numa": 31, "numactl": [29, 35], "number": [15, 20, 24, 28, 31, 32, 35, 36, 44, 45, 51, 54, 61, 62], "number_of_process": 61, "numer": 28, "numpi": [22, 25, 28, 53, 55], "nv_result": 54, "nvidia": [28, 51, 54, 55, 60], "nvme": 31, "o": [2, 22, 27, 31, 35, 37, 38, 39, 40, 42, 44, 52], "oam": 31, "object": [12, 14, 18, 28, 32, 33, 47, 48, 49, 51, 54, 55, 56, 57, 60], "oblig": 0, "obvious": 18, "occasionali": 27, "occupi": 18, "occur": 28, "ocl": 11, "ocloc": [39, 40], "off": [13, 29, 31, 33, 52, 62, 63], "offcial": 11, "offens": 0, "offer": [19, 30, 32, 49], "offici": [0, 16, 32, 44, 45, 46, 51, 54, 55, 57, 60, 61, 62], "offlin": [0, 36, 39, 40], "offononoffoff": 33, "often": [29, 37, 41, 42], "ok": 51, "omp": [4, 20, 32, 35], "omp_num_thread": [29, 35], "omp_proc_bind": 32, "omp_schedul": 32, "onboard": 32, "onc": [20, 28, 32, 36], "onconfig": [18, 19], "one": [11, 15, 20, 21, 28, 32, 39, 40, 47, 53, 55, 61], "oneapi": [2, 14, 21, 31, 34, 38, 45, 47, 48, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "oneapi_install_path": 34, "oneccl": [2, 37, 38, 42, 51], "onednn": [9, 11, 12, 14, 15, 20, 24, 32, 33, 36, 44], "onednn_cpu_git_vers": 33, "onednn_engin": 11, "onednn_gpu_git_vers": 33, "onednn_graph": 33, "onednn_graphoverrid": 33, "onednn_stream": 11, "onednn_verbos": 11, "onednngraph": 15, "onemkl": [37, 38, 39, 40, 42], "ones": [22, 25, 26, 33, 51], "onli": [2, 4, 5, 13, 14, 16, 17, 18, 20, 21, 23, 24, 28, 29, 30, 33, 34, 36, 37, 41, 51, 54, 55, 56, 57, 60, 61, 62], "onlin": [0, 31, 63], "op": [4, 9, 10, 16, 17, 20, 21, 23, 24, 26, 27, 28, 30, 35, 40, 49, 51, 54], "op_build": 11, "op_kernel": 11, "op_requires_ok": 11, "opaqu": 30, "open": [0, 5, 7, 14, 16, 18, 21, 34, 35, 37, 47, 48, 51, 52, 54, 55, 56, 57, 60, 63], "opencl": [14, 37, 39, 40, 42], "opencv": [49, 60], "openmp": [29, 39], "openvino": 49, "openxla": 4, "openxla_support_on_gpu": 21, "oper": [4, 13, 15, 16, 18, 23, 24, 28, 32, 35, 36, 63], "opinion": 0, "opkernel": 11, "opkernelconstruct": 11, "opkernelcontext": 11, "ops_overrid": 27, "opt": [2, 3, 11, 14, 37, 39, 40, 42, 46, 58], "optim": [2, 4, 9, 14, 15, 16, 17, 18, 23, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 60, 61, 63], "option": [2, 3, 7, 11, 18, 21, 29, 33, 35, 61, 62, 63], "order": [18, 19, 28, 29, 30, 32, 38, 43], "org": [0, 2, 7, 21, 39, 40, 49, 56], "organ": 16, "orient": 0, "origin": [4, 16, 18, 21, 23, 24, 25, 31, 36, 40, 45, 47, 49, 56], "orign": 31, "orthogon": [25, 26], "other": [0, 17, 20, 25, 28, 29, 30, 31, 32, 33, 34, 35, 37, 39, 40, 42, 56, 58, 63], "otherwis": [0, 17, 28, 33, 52, 53], "our": 29, "out": [3, 15, 28, 36, 40, 48, 51, 53, 54, 62], "outcom": 54, "outermost": 25, "output": [2, 7, 11, 13, 16, 19, 20, 24, 25, 28, 30, 31, 33, 35, 37, 39, 40, 47, 49, 52, 57], "output_dim": 35, "output_dir": [16, 55, 57, 60], "over": [18, 28, 49], "overal": [0, 32], "overhead": [13, 16, 28, 32, 35, 51], "overload": 26, "overrid": [4, 11, 18, 27, 28], "oversize_threshold": 29, "overview": 4, "own": [35, 49], "p": [2, 3, 25, 34, 41, 42, 47, 61], "pacakg": 56, "packag": [3, 27, 30, 32, 37, 38, 39, 41, 45, 51, 52, 55, 56, 60, 63], "pad": [24, 25, 53], "page": [5, 21, 22, 23, 32, 63], "paintbucket": 18, "parallel": [13, 20, 32, 35, 39], "paramet": [17, 26, 35, 47, 51], "parent": 9, "parsefromstr": 35, "part": [15, 16, 17, 32, 39, 40, 51, 60], "parti": [9, 36, 63], "particip": 0, "particular": 28, "particularli": 14, "partit": [15, 32], "pass": [11, 15, 16, 17, 28, 31, 33, 36, 49, 54, 62], "patch": [7, 34, 51, 54, 55, 57, 60, 62], "path": [2, 3, 7, 16, 18, 19, 20, 22, 29, 32, 33, 34, 37, 38, 39, 40, 42, 47, 49, 51, 52, 55, 57, 60, 61, 62], "path_to_itex": 3, "path_to_libitex_cpu_cc": 34, "path_to_libitex_gpu_cc": 34, "path_to_python_unit_test": 7, "path_to_site_packag": [37, 38, 42, 63], "path_to_tensorflow_serv": 3, "pattern": [0, 4, 15, 16, 21, 24], "pb": [18, 19, 34, 35, 47, 49], "pb_file": 35, "pbtxt": 17, "pci": [2, 30], "pcie": 31, "pdf": 25, "peak": [18, 23], "penal": 32, "peopl": 0, "per": [17, 28, 29, 31, 32, 38, 58, 62], "perf": 27, "perform": [4, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 28, 29, 32, 33, 35, 36, 39, 40, 44, 49, 51, 52, 54, 55, 60, 62, 63], "period": [0, 32], "permiss": [0, 5], "person": 0, "perspect": [29, 32], "phase": [15, 31, 36, 51], "phase1": [31, 51], "phase2": 51, "phase_2": 51, "photo": 52, "physic": [0, 30, 32, 62], "physical_devic": [14, 58], "physical_device_desc": 2, "physicaldevic": [14, 58], "pick": 7, "picker": 5, "piecewiseconstantdecai": 25, "pip": [7, 11, 14, 22, 27, 33, 34, 37, 38, 39, 40, 41, 42, 45, 46, 49, 51, 54, 55, 58, 60, 62, 63], "pip3": 41, "pip_packag": [11, 39], "pip_set_env": [51, 52, 54, 55, 57, 60, 61], "pipelin": [16, 44, 45, 52], "pjrt": [4, 16, 21, 63], "place": [4, 17, 21, 32, 40], "placement": [29, 32], "plai": 32, "plain": 36, "platform": [14, 16, 28, 32, 33, 37, 39, 40, 41, 51, 54, 55, 56, 57, 60, 61, 62], "platinum": [31, 32, 35], "pleas": [7, 11, 14, 16, 17, 21, 27, 28, 37, 39, 40, 42, 44, 45, 47, 51, 53, 55, 57, 58, 60, 61, 63], "plu": [16, 32], "plug": [34, 63], "pluggabl": [4, 10, 16, 30, 40], "pluggable_devic": 30, "pluggable_device_factori": 30, "pluggabledevic": [10, 27, 63], "plugin": [4, 10, 16, 18, 19, 21, 22, 34, 39, 58, 63], "po": 35, "point": [17, 18, 20, 28, 33, 37, 42, 47], "polici": [29, 32, 63], "polit": 0, "polymorph": 11, "pool": 4, "popular": [15, 16, 31], "port": [34, 54], "portabl": [16, 36], "posit": [0, 7], "possibl": [4, 19, 32, 35, 36, 39], "post": [0, 7, 18, 19, 24, 33], "post1": 40, "potenti": [28, 63], "power": [19, 63], "ppn": [55, 58, 60, 61], "pr": 5, "practic": [4, 28, 29], "pramet": 62, "pre": [18, 31, 33, 41, 42, 51, 56], "precis": [4, 16, 30, 31, 33, 44, 45, 49, 54, 57], "preconfigur": 39, "predict": [19, 26, 27, 28, 35, 57], "predict_batch_s": 16, "predict_fil": 57, "prefer": [29, 37, 41, 42], "prefix": 29, "preload": 32, "preop": 18, "prepack": 4, "prepend": [29, 55, 58, 60, 61], "preprocess": 60, "preprocess_data": 55, "present": [30, 54], "preserv": 20, "press": 38, "pretrain": [31, 44, 49], "pretrain_bert": 51, "pretrain_lamb": 51, "pretrain_path": 51, "pretrain_result_dir": 51, "prevent": 28, "previou": [8, 25, 32, 51], "previous": [28, 30], "primari": [17, 32], "primit": [11, 13, 20, 36], "primitive_attr": 11, "primitive_desc": 11, "principl": 18, "print": [2, 11, 19, 22, 25, 28, 29, 30, 33, 35, 37, 38, 39, 40, 41, 42, 47, 48, 51, 53, 54, 62, 63], "print_graph": 35, "printf": 51, "priorit": 18, "prioriti": [20, 33], "privaci": 0, "privat": 0, "privileg": [2, 3, 47], "problem": [14, 24, 28, 32, 56], "proc": [28, 32], "procedur": [11, 37, 41, 42], "process": [4, 7, 11, 16, 21, 28, 29, 32, 34, 51, 52], "process_per_nod": 61, "processor": [4, 21, 31, 32, 41, 47, 52, 53], "proclist": 32, "produc": 57, "product": [5, 7, 21, 34, 37], "profession": 0, "profil": [4, 9, 28, 30, 32], "profiler_demo": 22, "program": [9, 27, 32, 63], "project": [2, 5, 7, 16, 63], "prolong": [39, 40], "promot": 7, "prompt": [31, 39, 40], "promptli": 0, "prop_kind": 11, "propag": [9, 13, 16, 17], "properli": [21, 29], "properti": [17, 18, 28], "propos": [7, 25], "protect": 11, "protobuf": 52, "protocol": 49, "protocolmessag": 33, "provid": [0, 2, 4, 7, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 42, 44, 45, 49, 51, 52, 55, 60, 61, 62, 63], "proxi": 36, "prune": 35, "pseudocod": 28, "pub": 37, "public": [0, 4, 5, 11, 21, 25, 33, 34], "publish": [0, 5], "pull": [7, 34, 41, 42, 47], "pure": 31, "push": [5, 16], "put": 34, "pvc": [39, 40, 51], "pwd": [47, 62], "py": [7, 11, 16, 22, 29, 34, 35, 42, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "pybind11": 60, "pycocotool": 60, "pylint": 7, "pylintrc": 7, "pypi": [2, 43, 63], "python": [2, 4, 9, 14, 19, 22, 23, 25, 26, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 41, 42, 45, 46, 49, 51, 52, 53, 55, 56, 57, 58, 60, 61, 63], "python3": [2, 5, 16, 38, 39, 54, 56], "pythonhost": 40, "pythonpath": 61, "pytorch": [27, 30], "q1": 14, "q_model": 49, "qdq": 52, "qo": 37, "qualiti": 28, "quantiz": [4, 44], "quantizev2": 49, "queri": 28, "question": [0, 4, 36, 63], "queue": [35, 62], "quick": [4, 11, 37, 44], "quickli": [20, 28], "r": [3, 7, 14, 28, 31, 32, 44, 62], "r2": [34, 40, 62], "race": 0, "rais": 33, "rand": 53, "random": [25, 35, 53], "randomnorm": 40, "rang": [25, 28, 32, 35], "rank": [31, 55, 58, 60, 61], "rapid": [41, 47], "rare": 28, "rate": [14, 15, 18, 25, 34], "rather": 25, "ratio": 36, "raw": 58, "rb": 35, "rcfile": 7, "rcnn": 49, "re": [2, 32, 35, 46], "reach": 18, "read": [20, 28, 35, 45, 55], "readm": 61, "real": [15, 28, 36, 51, 61], "reason": [0, 28, 30], "recent": 56, "recogn": [44, 45], "recommend": [16, 20, 28, 32, 33, 34, 35, 37, 38, 39, 41, 42, 46, 52], "record": [36, 61], "recurrent_activ": [25, 26], "recurrent_initi": [25, 26], "recurs": 7, "red": 42, "reduc": [15, 16, 18, 28, 32, 36, 39, 40, 45, 51, 54, 62], "reduce_mean": 35, "ref_result_dir": 54, "refer": [2, 3, 7, 11, 14, 15, 17, 18, 19, 20, 21, 23, 28, 31, 32, 33, 34, 37, 39, 40, 42, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "refresh": 22, "regardless": 0, "region": 32, "regist": [4, 14, 30, 45, 52], "register_": 11, "register_geluop": 11, "register_kernel_build": 11, "registr": [10, 11, 55], "registrationcent": [37, 42], "regress": 27, "regular": [25, 36], "reinstal": 51, "reject": 0, "rel": [16, 29, 51], "relat": [5, 27, 29, 34, 36], "relationship": [14, 18], "releas": [4, 14, 17, 32, 33, 34, 39, 40, 45, 54, 56], "reli": 17, "relianc": 16, "religion": 0, "relu": [4, 11, 19, 21, 24, 25, 26, 28, 35, 53], "relu6": 24, "relu_op": 11, "relu_op_functor": 11, "relubaseop": 11, "relugrad": 24, "remain": [20, 30], "remapp": [19, 24, 33], "remot": 32, "remov": [0, 11, 16, 18, 24], "reorder": [13, 36], "repeat": 18, "replac": [14, 25, 26, 27, 34, 36, 40, 51], "replica": [11, 20], "repo": [5, 31, 37, 38], "report": [0, 7, 20, 63], "repositori": [9, 16, 31, 37, 51, 55, 60], "repres": [0, 4, 16, 17, 30, 31], "represent": 15, "representative_dataset": 49, "reproduc": 31, "request": [0, 7, 63], "requir": [2, 4, 7, 11, 13, 15, 16, 21, 22, 24, 25, 28, 29, 30, 36, 38, 45], "rerun": 28, "research": 57, "reserv": 32, "reset": 54, "reshap": [19, 25, 28, 35], "resnet": [61, 62], "resnet101": 49, "resnet34": 49, "resnet50": [17, 29, 31, 44, 49, 59], "resnet50_itex": 62, "resnet_ctl_imagenet_main": 62, "resnet_v1_50": 22, "resolv": 1, "resourc": [29, 32, 56], "respect": [0, 29, 35, 51], "rest": [20, 24], "rest_api_port": 34, "restart": 38, "result": [5, 15, 16, 17, 19, 22, 27, 28, 30, 32, 33, 38, 45, 48, 53, 54, 56, 62], "result_dir": 51, "retinanet50": 49, "retrain": 28, "retriev": [28, 49], "return": [11, 17, 28, 30, 33, 35, 40], "return_sequ": 25, "return_st": 25, "reus": [32, 45], "review": 0, "rewrit": [11, 17], "rewrite_opt": 52, "rewriter_config_pb2": 52, "rewriterconfig": 52, "rewritten": 16, "rf": [34, 46, 61], "rfc": [7, 21], "right": [0, 25], "rm": [34, 40, 46, 47, 61], "rmsprop": [19, 28, 35], "role": 32, "root": [7, 39, 40, 56], "rpath": 40, "rule": 19, "run": [7, 11, 14, 16, 18, 19, 22, 24, 26, 27, 28, 29, 31, 32, 33, 35, 39, 41, 42, 63], "run_20210712212258_inst": 29, "run_20210712212258_instance_0_cores_0": 29, "run_20221009103552_inst": 29, "run_20221009103552_instance_0_cores_0": 29, "run_20221009104740_inst": 29, "run_20221009104740_instance_0_cores_0": 29, "run_20221009105044_inst": 29, "run_20221009105044_instance_0_cores_12": 29, "run_20221009105320_inst": 29, "run_20221009105320_instance_0_cores_0": 29, "run_20221009105838_inst": 29, "run_20221009105838_instance_0_cores_0": 29, "run_20221009105838_instance_1_cores_12": 29, "run_20221009105838_instance_2_cores_24": 29, "run_20221009105838_instance_3_cores_36": 29, "run_20221009105838_instance_4_cores_48": 29, "run_20221009105838_instance_5_cores_60": 29, "run_20221009105838_instance_6_cores_72": 29, "run_20221009105838_instance_7_cores_84": 29, "run_20221009110327_inst": 29, "run_20221009110327_instance_0_cores_0": 29, "run_20221009110327_instance_10_cores_40": 29, "run_20221009110327_instance_11_cores_44": 29, "run_20221009110327_instance_12_cores_48": 29, "run_20221009110327_instance_13_cores_52": 29, "run_20221009110327_instance_14_cores_56": 29, "run_20221009110327_instance_15_cores_60": 29, "run_20221009110327_instance_16_cores_64": 29, "run_20221009110327_instance_17_cores_68": 29, "run_20221009110327_instance_18_cores_72": 29, "run_20221009110327_instance_19_cores_76": 29, "run_20221009110327_instance_1_cores_4": 29, "run_20221009110327_instance_20_cores_80": 29, "run_20221009110327_instance_21_cores_84": 29, "run_20221009110327_instance_22_cores_88": 29, "run_20221009110327_instance_23_cores_92": 29, "run_20221009110327_instance_2_cores_8": 29, "run_20221009110327_instance_3_cores_12": 29, "run_20221009110327_instance_4_cores_16": 29, "run_20221009110327_instance_5_cores_20": 29, "run_20221009110327_instance_6_cores_24": 29, "run_20221009110327_instance_7_cores_28": 29, "run_20221009110327_instance_8_cores_32": 29, "run_20221009110327_instance_9_cores_36": 29, "run_20221009110849_inst": 29, "run_20221009110849_instance_0_cores_0": 29, "run_20221009110849_instance_1_cores_11": 29, "run_20221009110849_instance_1_cores_24": 29, "run_20221009110849_instance_2_cores_22": 29, "run_20221009110849_instance_2_cores_48": 29, "run_20221009110849_instance_3_cores_33": 29, "run_20221009110849_instance_3_cores_72": 29, "run_20221009111034_instance_0_cores_0": 29, "run_20221009111239_instance_0_cores_24": 29, "run_20221009111753_inst": 29, "run_20221009111753_instance_0_cores_0": 29, "run_20221009111951_inst": 29, "run_20221009111951_instance_0_cores_0": 29, "run_20221009112720_instance_0_cores_0": 29, "run_20221009112905_instance_0_cores_0": 29, "run_20221009112956_instance_0_cores_0": 29, "run_classifi": 16, "run_inf": 35, "run_jupyt": 52, "run_pretraining_lamb": 51, "run_squad": [51, 57], "runner": 61, "runtim": [16, 18, 23, 25, 27, 28, 32, 36, 37, 39, 40, 51, 63], "safe": [13, 18, 33, 63], "sai": [28, 51], "same": [5, 7, 14, 20, 21, 23, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 39, 40, 45, 53], "sampl": [2, 22, 31, 35, 45, 52, 54], "samsung": 31, "saniti": [7, 63], "sapphir": [41, 47], "satisfi": [13, 23], "save": [5, 11, 17, 29, 33, 49, 57], "save_checkpoint_step": 51, "save_json_data": 35, "saved_model": 34, "savedmodel": 49, "scalabl": [4, 21, 31, 34, 41, 47], "scale": [4, 25, 26, 31, 35, 62], "scaled_gradi": 28, "scaled_loss": 28, "scenario": [4, 13, 20, 21, 23, 32, 33], "schedul": [13, 16, 25, 29, 32, 35], "schmidhub": 25, "scope": [17, 40], "scratch": [28, 51], "scratchpad": [11, 13], "scratchpad_mem": 11, "scratchpad_mod": 11, "screen": 47, "script": [5, 21, 22, 27, 32, 39, 40, 42, 47, 49, 51, 53, 55, 56, 60, 61], "sdp": 29, "seamless": [4, 30], "search": [7, 29], "sec": [31, 35, 51, 62], "second": [32, 35, 52, 61, 62], "section": [14, 28, 32, 37, 39, 40, 49], "secur": 0, "see": [0, 1, 2, 4, 7, 14, 16, 22, 25, 28, 29, 32, 34, 36, 37, 39, 52, 61, 63], "seed": 60, "seen": 32, "segment": [31, 44, 60], "select": [14, 28, 29, 30, 33, 54, 63], "self": 35, "semant": [17, 20, 25], "send": 16, "separ": [11, 14, 23, 24, 28, 31, 32, 38, 39, 63], "seq": 16, "sequenc": [31, 51, 54], "sequenti": 35, "seri": [0, 16, 32, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "serial": 35, "seriesintel": 47, "seriesne": 47, "seriessupport": 47, "seriou": 0, "serv": [4, 30], "serval": 27, "server": [5, 31, 39, 40, 42], "servic": 55, "serving_plugin": 34, "session": [40, 52], "set": [0, 2, 4, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 27, 31, 32, 33, 35, 37, 38, 40, 42, 47, 51, 52, 57, 63], "set_config": [17, 18, 19, 47, 62], "set_env_cpu": [47, 48, 56], "set_env_gpu": [47, 48, 56], "set_global_polici": 28, "set_log_device_plac": 22, "set_scratchpad_mod": 11, "set_sess": 52, "set_weight": 28, "setup": [38, 41, 43, 45], "setvar": [14, 37, 42, 46, 58], "sever": [4, 16, 21, 29, 31, 32, 39, 40, 44, 61], "sex": 0, "sexual": 0, "sh": [2, 3, 5, 14, 34, 37, 38, 39, 40, 42, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 63], "shape": [11, 13, 16, 17, 19, 25, 28, 30, 35, 36, 53], "shard": [4, 17, 21, 33], "sharding_config": [17, 62], "shardingconfig": [17, 62], "share": [7, 14, 32, 37, 47, 48, 51, 54, 55, 57, 60], "short": [16, 25, 28], "shoul": 40, "should": [2, 3, 5, 7, 22, 27, 28, 32, 34, 35, 37, 38, 40, 41, 42, 45, 51, 57, 62], "show": [5, 14, 16, 18, 27, 28, 31, 35, 39, 40, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "showcas": [16, 31], "shown": [2, 3, 15, 22, 24, 29, 51, 54, 55, 60], "shuffl": 28, "sigmoid": [24, 25, 26], "sign": [25, 37], "signific": [4, 7, 18], "significantli": [4, 28], "signoff": 51, "similar": [19, 32], "simpl": [4, 21, 23, 28, 40], "simpli": [28, 30, 62], "simplifi": 45, "simultan": [31, 42], "sinc": [4, 14, 28, 32, 36, 42], "singl": [0, 4, 7, 15, 20, 21, 24, 31, 51, 60, 61], "single_l2_loss_op": 62, "site": [5, 8, 37, 38, 39, 42, 56, 63], "situat": [20, 33], "size": [0, 20, 25, 28, 29, 31, 51, 58, 62], "skip": [7, 28, 29, 38], "skip_cross_node_cor": 29, "skip_ev": 62, "sle": 42, "sleep": 32, "slowdown": 16, "slower": [18, 19, 28, 35], "slowli": 28, "small": [13, 25, 28, 29, 32, 35], "sn850x": 31, "snapshot": 39, "snippet": 61, "so": [14, 16, 19, 28, 29, 32, 33, 34, 39, 40, 47, 48, 51, 54, 55, 56, 57, 58, 60], "social": 0, "socio": 0, "socket": [31, 32, 38, 62], "softmax": [18, 19, 28], "softwar": [2, 16, 38, 43, 45, 52, 53, 58], "sole": 32, "solut": [4, 14, 15, 21, 27, 30], "solv": [28, 56], "some": [2, 11, 18, 19, 26, 28, 29, 32, 39, 40, 49, 51, 58], "sometim": 7, "sort": [0, 16], "sourc": [2, 3, 4, 7, 11, 16, 17, 21, 37, 38, 42, 43, 46, 47, 48, 52, 55, 56, 58, 60, 63], "sp4": [31, 42], "sp5": 42, "space": [0, 32, 63], "sparse_categorical_crossentropi": [19, 28], "sparsecategoricalaccuraci": [28, 35], "sparsecategoricalcrossentropi": [28, 35], "special": [16, 19, 23, 28, 39, 40], "specif": [4, 16, 28, 30, 32, 33, 34, 37, 42, 61, 63], "specifi": [0, 3, 11, 21, 24, 28, 29, 32, 34, 39, 40, 49], "sped": 28, "speed": [15, 16, 18, 32, 44, 45], "speedup": [16, 31, 52, 62], "spend": 28, "split": [17, 18, 35], "squad": [31, 51, 57], "squad_dir": 57, "squad_vers": 51, "src": [7, 11, 14, 17, 34, 39], "src_mem": 11, "src_tensor": 11, "ssd": [31, 49], "ssdsc2kg960g8": 31, "st": [3, 40], "stabil": [19, 28], "stabl": [25, 28, 44, 63], "stable_diffusion_accuraci": 54, "stable_diffusion_infer": 54, "stable_diffussion_infer": 54, "stablehlo": 16, "stack": [31, 42, 43], "stage": [16, 52], "stage_num": [17, 62], "stall": 32, "standard": [7, 25], "standard_op": 40, "start": [2, 3, 14, 21, 22, 28, 29, 34, 35, 63], "startup": [39, 40], "stat": 22, "static": 32, "statist": 49, "statu": [0, 11, 19, 40], "status_msg": 40, "statusuniqueptr": 11, "std": [11, 40], "stdout": [7, 29], "steal": 35, "step": [3, 16, 17, 18, 25, 28, 31, 32, 34, 36, 44, 45, 51, 55, 58, 60, 62], "steps_per_epoch": [35, 60], "steps_per_loop": 62, "still": 28, "stock": [14, 16, 23, 24, 28, 30, 37, 38, 41, 42, 45, 49, 51, 54, 55, 56, 57, 60, 61, 62, 63], "stop": [22, 32], "storag": [16, 28, 31, 35, 47, 49, 56], "store": 36, "strategi": 32, "stream": [13, 27, 54, 62], "stream_executor": 28, "streamexecutor": [10, 30], "streamlin": [4, 21, 34], "strictli": 25, "stride": 53, "string": [18, 28, 29, 39, 40], "stringop": 34, "strong": 18, "structur": [4, 19, 29, 32], "sub": [9, 14, 18, 19, 32, 33], "subgraph": [15, 16], "submit": [5, 7, 63], "subsequ": [18, 19, 28, 32, 54], "subystem": 37, "succe": 36, "success": [48, 53, 54, 62], "successfulli": [14, 34, 38, 39, 40, 42, 62], "sudo": [7, 34, 37, 39, 40, 42], "suffici": [28, 35], "suggest": [56, 62], "sum": 35, "summari": [51, 63], "super": 35, "suppli": 35, "support": [4, 7, 13, 14, 15, 16, 17, 18, 19, 22, 24, 27, 28, 29, 30, 32, 33, 37, 39, 40, 41, 42, 45, 47, 52, 61, 62], "suppos": [32, 51], "sure": [3, 11, 28, 35, 37, 39, 40], "suse": [31, 42], "sustain": 0, "sw": 37, "swish": [19, 24], "switch": [4, 5, 27, 32, 35, 39], "sy": 53, "sycl": 14, "sycl_runtim": [14, 28], "symbol": 40, "sync": 33, "system": [14, 21, 30, 31, 32, 34, 35, 38, 39, 40, 56], "t": [2, 5, 11, 13, 17, 18, 20, 28, 29, 31, 36, 49, 54, 56], "tab": 22, "tabl": [18, 28, 29, 30, 31, 49], "tag": 5, "take": [0, 11, 16, 24, 28, 29, 32, 34, 35, 38, 51], "tanh": [24, 25, 26], "tape": 28, "tar": [3, 7, 32, 49], "target": [3, 16, 17, 39, 40], "task": [11, 20, 32, 61], "task_nam": 16, "taskset": 29, "tbb": 42, "tdp": 31, "team": [7, 54], "techniqu": [15, 28], "technologi": [16, 45], "tee": [29, 37, 51, 62], "tell": 14, "templat": 11, "temporari": 13, "tensor": [11, 16, 25, 28, 30, 40, 53], "tensorboard": [22, 63], "tensorflow": [5, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "tensorflow2": [51, 58, 60], "tensorflow2_keras_mnist": 58, "tensorflow_doc": 56, "tensorflow_hub": 22, "tensorflow_model_serv": [3, 34], "tensorflow_plugin": 34, "tensorflow_serv": [3, 34], "tensorflow_src": 40, "term": [0, 25, 30, 63], "termin": 38, "test": [9, 19, 22, 28, 34, 35, 38, 44, 55, 56], "test_accuraci": 28, "test_dataset": 28, "test_func": 28, "test_scor": [19, 28], "test_step": 28, "text": [18, 31, 44], "text2imag": [31, 44], "tf": [11, 14, 15, 19, 22, 25, 26, 27, 28, 29, 30, 33, 35, 37, 39, 40, 41, 42, 51, 52, 53, 62], "tf2": [49, 51, 56], "tf32": [20, 31, 51], "tf_auto_jit_flag": 27, "tf_auto_mixed_precision_graph_rewrite_allowlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_allowlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_add": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_level": 18, "tf_auto_mixed_precision_graph_rewrite_log_path": 18, "tf_bert_finetune_": 51, "tf_bert_pretraining_lamb_": 51, "tf_check_ok": 40, "tf_code": 40, "tf_compatible_vers": 33, "tf_copt": [11, 34], "tf_cpp_max_vlog_level": 20, "tf_cpp_min_log_level": 20, "tf_cuda_librari": 34, "tf_enable_onednn_opt": 29, "tf_getcod": [11, 40], "tf_hub": 22, "tf_include_path": 40, "tf_kera": 27, "tf_loadpluggabledevicelibrari": 40, "tf_messag": 40, "tf_newopdefinitionbuild": 11, "tf_newstatu": [11, 40], "tf_num_interop_thread": 62, "tf_num_intraop_thread": 62, "tf_ok": [11, 40], "tf_opdefinitionbuild": 11, "tf_opdefinitionbuilderaddattr": 11, "tf_opdefinitionbuilderaddinput": 11, "tf_opdefinitionbuilderaddoutput": 11, "tf_opdefinitionbuildersetshapeinferencefunct": 11, "tf_registeropdefinit": 11, "tf_serv": 34, "tf_statu": 40, "tf_use_legacy_kera": [27, 51, 54], "tf_ver": 2, "tf_xla_auto_jit": [16, 27, 30], "tf_xla_flag": [16, 27, 30], "tf_xla_use_device_api": [16, 30], "tfa": [25, 26, 55], "tfcc_path": 40, "tfd": 61, "tfg": 17, "tfg_optimizer_hook": 62, "tfg_to_h": 17, "tfhub": 22, "tfrecord": [51, 55, 61], "tfx": 21, "than": [19, 25, 28, 32, 35, 37, 42, 47, 53, 58], "thei": [0, 18, 28, 29, 32], "them": [16, 18, 21, 28, 29, 32, 34, 56, 61], "therefor": [28, 32], "thereof": 16, "thi": [0, 2, 3, 4, 5, 11, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 45, 46, 49, 50, 51, 52, 53, 55, 57, 60, 62, 63], "thing": 21, "think": 28, "third": [9, 36, 63], "third_parti": [7, 9, 34], "those": [0, 16, 18, 19, 34, 61], "though": 39, "thrash": 32, "thread": [4, 13, 20, 29, 31, 32, 33, 42], "threadpool": [3, 20, 40], "threaten": 0, "three": [4, 21, 22, 23, 29], "through": [0, 27, 28, 32, 35, 39, 40, 55, 63], "throughput": [31, 47, 51, 54], "throughput_mod": 29, "throughput_train": 51, "thu": 32, "tiger_cat": 48, "tightli": 30, "tile": [17, 20, 33, 51, 58, 60, 61, 62], "time": [0, 4, 11, 14, 16, 18, 19, 20, 21, 22, 28, 31, 32, 35, 39, 40, 45, 49, 51], "timehistori": [61, 62], "tip": [11, 20, 32, 34], "tmp": 34, "todai": 30, "togeth": 32, "toggl": 33, "toi": 28, "token": [54, 56], "too": [18, 28, 37, 42], "tookit": [39, 40], "tool": [7, 9, 11, 14, 18, 32, 36, 37, 38, 39, 40, 42, 63], "toolchain": 39, "toolkit": [14, 31, 37, 38, 45, 47, 58, 63], "top": 27, "topic": 4, "topologi": [21, 29, 32], "total": [31, 32, 35, 49, 51, 58], "total_loss": 51, "total_tim": 35, "total_training_step": 51, "tour": 63, "tout": 24, "toward": 0, "tpl": 7, "tpost": 24, "tpu": 49, "trace": 22, "traceback": 56, "track": [22, 56], "train": [2, 14, 17, 18, 21, 24, 25, 26, 27, 29, 34, 35, 37, 38, 42, 43, 44, 47, 51, 52, 57, 59, 63], "train_accuraci": 62, "train_and_ev": 61, "train_batch_s": [57, 60], "train_batch_size_phase1": 51, "train_batch_size_phase2": 51, "train_dataset": 28, "train_epoch": 62, "train_fil": 57, "train_horovod": 58, "train_loss": [51, 62], "train_maskrcnn": [55, 60], "train_step": [28, 51, 62], "trainabl": [25, 35], "trainable_vari": 28, "trainer": 61, "trainingop": 24, "transfer": 52, "transform": [24, 25], "translat": [0, 39, 40], "transpar": [4, 21], "transpos": [24, 26], "travers": 36, "treat": 20, "tree": [39, 40], "tri": 56, "tricki": 28, "trigger": [5, 19, 33], "troll": 0, "true": [11, 16, 22, 25, 26, 28, 29, 30, 33, 35, 40, 51, 57, 62], "truncat": 34, "try": [11, 21, 29, 45, 49, 52], "ttt": 31, "tumor": 55, "tune": [31, 33, 45, 51], "tupl": 35, "turbo": 31, "turn": [17, 63], "tutori": 56, "two": [4, 13, 14, 19, 21, 23, 28, 32, 35, 39, 47, 51, 54, 55, 60], "txt": [16, 18, 37, 42, 54, 57, 62], "type": [4, 7, 11, 14, 18, 20, 21, 29, 31, 33, 38, 39, 40, 47, 49], "type_infer": 17, "typeconstraint": 11, "typeerror": 56, "typenam": 11, "typic": [4, 21, 23, 28, 32], "u": [0, 22, 29, 42], "ubuntu": [2, 31, 34, 39, 40, 41, 42], "ubuntu22": 56, "ubuntu_vers": 2, "uma": 32, "unaccept": 0, "uncased_l": 51, "unchanged_shape_fn": 11, "undef": 11, "undefin": [2, 30], "under": [17, 23, 26, 29, 33, 39, 52], "understand": 36, "undesir": 29, "unet": [31, 44], "unet_3d_med": 55, "unexpect": 51, "unifi": [21, 29, 37], "uniform": [4, 16, 21, 30, 35], "uniniti": 17, "uninstal": [11, 51, 60], "unit": [19, 25, 28, 32, 35], "unknown": [14, 28], "unkown": 27, "unless": 33, "unmodifi": 16, "unnecessari": [24, 28, 32], "unoptim": 36, "unordered_map": 11, "unprofession": 0, "unsafe_force_al": 18, "unscal": 28, "unshard": 17, "unsolicit": 0, "unspecifi": 29, "until": [18, 32], "unwelcom": 0, "unzip": 40, "up": [18, 22, 28, 32, 37, 40, 44, 51, 54, 57], "updat": [2, 18, 27, 28, 37, 38, 39, 40, 41, 42, 62], "update_st": 28, "upenn": 55, "upgrad": [14, 37, 38, 41, 42, 45, 46, 49, 55, 60, 63], "upon": 55, "upstream": [14, 18], "url": [49, 54, 56], "us": [0, 2, 3, 4, 5, 7, 13, 14, 15, 16, 18, 19, 20, 22, 23, 24, 25, 26, 28, 31, 32, 33, 36, 37, 38, 39, 40, 42, 44, 46, 47, 49, 50, 51, 52, 53, 55, 56, 57, 60, 63], "usag": [4, 14, 16, 21, 32, 33, 35, 44], "use_bia": [25, 26], "use_default_alloc": 29, "use_itex_shard": 62, "use_logical_cor": 29, "use_mytrain": 51, "use_synthetic_data": [60, 62], "use_tf_funct": 62, "use_tf_while_loop": 62, "use_tpu": 57, "use_xla": 51, "usecyclespersecondtim": [4, 21, 22, 28], "user": [4, 5, 7, 11, 13, 19, 20, 21, 23, 27, 30, 37, 39, 40, 41, 42, 43, 47, 54, 63], "usr": [7, 29, 37, 39], "usual": 18, "ut": 7, "util": [4, 9, 11, 14, 16, 21, 23, 29, 31, 32, 35, 56, 62], "v": [2, 3, 16, 18, 34, 38, 40, 42, 46, 47], "v0": [31, 33, 38], "v1": [35, 49, 51, 52, 57, 63], "v100": 51, "v1_8": [35, 47], "v2": [15, 31, 33, 38, 42, 49, 51, 61, 63], "v3": [15, 44], "v4": [18, 35, 44], "val_accuraci": 28, "val_loss": 28, "valid": [8, 33], "validation_split": [19, 28, 35], "valu": [15, 17, 18, 20, 25, 28, 29, 31, 32, 33, 61], "valueerror": 33, "var": [2, 14, 34, 38, 39, 40, 42], "vari": 27, "variabl": [2, 4, 13, 15, 16, 19, 21, 22, 23, 24, 25, 27, 28, 30, 32, 34, 35, 38, 40, 52], "variable_dtyp": 28, "varianc": 25, "varibl": 51, "varieti": 44, "variou": 16, "ve": [39, 40], "vector": 40, "venv": [46, 55, 58, 60], "verbos": [11, 19, 20, 28, 29, 30, 35], "veri": [15, 28, 51], "verifi": [38, 39, 40, 44, 51, 54, 55, 56, 57, 60, 61, 62], "version": [0, 2, 11, 14, 16, 27, 28, 31, 32, 37, 38, 39, 40, 41, 42, 45, 46, 51, 56], "versu": [19, 32], "via": [0, 4, 11, 17, 27, 30, 31, 35, 44, 62, 63], "view": 8, "viewer": 22, "viewpoint": 0, "violat": 0, "virtual": [39, 40, 51, 52, 54, 55, 56, 57, 60, 61, 62], "virtual_env": 29, "visibl": [0, 2, 11, 34], "vision": 30, "visit": 63, "vnni": 52, "vocab": [16, 57], "vocab_fil": [16, 57], "void": 11, "volum": 55, "vulner": 63, "vz": 40, "w": [28, 31, 35, 44], "wa": [0, 29, 32, 33, 39, 40], "wai": [0, 16, 19, 28, 30, 34, 36, 38], "wait": 32, "want": [3, 5, 7, 28, 29, 37, 39, 40, 42, 51, 54, 57, 60], "warm": [22, 35], "warmup": 35, "warmup_step": 55, "warmup_steps_phase1": 51, "warmup_steps_phase2": 51, "warn": [28, 29, 40, 51], "wd": [25, 31], "wd_black": 31, "we": [0, 2, 7, 11, 24, 27, 28, 31, 32, 33, 34, 35, 38, 39, 40, 45, 46, 47, 49, 51, 52, 54, 55, 56, 57, 60, 61, 63], "weak": 31, "web": [5, 56], "websit": [45, 63], "weight": [4, 13, 25, 28, 51, 53, 62], "weight_decai": [25, 26], "welcom": [0, 7, 63], "well": [0, 2, 8, 11, 21, 26, 28, 29, 30, 31, 32, 51], "were": [0, 16, 29, 32], "wether": 27, "wget": [2, 7, 32, 35, 37, 39, 40, 42, 47, 49, 56, 58], "what": [0, 14, 28], "wheel": [2, 38, 39], "when": [0, 5, 14, 17, 19, 24, 27, 28, 29, 32, 34, 35, 36, 37, 39, 40, 51, 52, 55, 56, 60], "where": [25, 28, 31, 32, 39, 49], "wherea": 61, "wherebi": 32, "whether": [24, 29, 32], "which": [0, 4, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 24, 28, 29, 30, 32, 33, 35, 36, 37, 39, 40, 42, 45, 46, 52, 57], "while": [16, 21, 28, 31, 32, 33, 34, 39, 48, 53, 56], "whitespac": 51, "whitlei": 31, "whl": [2, 11, 39, 40, 63], "whole": [18, 20, 33, 51], "whole_seq_output": 25, "whose": 18, "why": 0, "wide": [14, 25, 36, 44], "wiki": 0, "wiki_onli": 51, "wikicorpus_en": 51, "wikipedia": [31, 32, 51], "wish": 39, "within": [0, 15, 25, 30, 37, 51], "without": [0, 4, 16, 18, 20, 21, 23, 28, 30, 31, 39, 40, 44, 52, 56, 63], "withsum": 24, "wl": 40, "wno": 34, "won": [5, 29, 36], "work": [1, 4, 7, 14, 15, 19, 20, 21, 27, 28, 29, 32, 35, 36, 40, 42, 45, 49, 52], "worker": 28, "workflow": 16, "workload": [2, 4, 16, 32, 35, 44, 52, 60, 63], "workspac": [2, 3, 34], "world": 28, "wors": 47, "would": [28, 37, 39, 61], "wrap": 28, "wrap_funct": 35, "wrapper": [28, 42], "write": [5, 7, 16, 19], "written": [0, 7, 27], "wrong": [39, 40], "ws1": 47, "wu": 25, "www": [0, 21, 42], "x": [11, 19, 25, 26, 28, 31, 39, 40, 47, 53, 58], "x15": 14, "x710": 31, "x86_64": [38, 39, 40], "x_test": [19, 28, 35], "x_train": [19, 28, 35], "xe": 31, "xeon": [4, 21, 31, 32, 35, 39, 40, 41, 44, 47], "xfd": 11, "xla": [4, 16, 27], "xla_global_id": 2, "xpu": [2, 4, 11, 14, 17, 19, 22, 25, 26, 28, 30, 33, 37, 38, 43, 45, 46, 47, 48, 49, 53, 54, 55, 58, 60], "xpu_force_sync": 33, "xpu_lib_path": 40, "xpuautoshard": [4, 33, 44], "xx": [34, 61], "xxx": [7, 52, 56], "xxxx": [58, 61], "xxxxx": [34, 51, 62], "xxxxxx": 11, "xxxxxxxx": 52, "xzf": 7, "xzvf": 32, "y": [11, 25, 26, 28, 35, 37, 39, 40, 47, 58, 63], "y_test": [19, 28, 35], "y_train": [19, 28, 35], "yaml": 61, "ye": [19, 38], "you": [2, 3, 4, 5, 7, 8, 11, 13, 14, 16, 17, 18, 20, 21, 22, 23, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60, 61, 62], "your": [2, 3, 5, 7, 14, 27, 30, 32, 34, 35, 37, 38, 39, 40, 41, 42, 46, 47, 49, 51, 52, 54, 56, 62, 63], "your_script": 29, "your_script_arg": 29, "yourself": 29, "yuxin": 25, "yyi": 52, "yym": 58, "yyyi": 58, "z": [40, 58], "ze_api": 14, "ze_enable_tracing_lay": [4, 21, 22, 28], "zero": [14, 25, 26, 28, 37], "zip": 28, "zoo": 44, "zxvf": 49, "zzz": 7, "zzzz": 58}, "titles": ["Contributor Covenant Code of Conduct", "Security Policy", "Intel\u00ae Extension for TensorFlow* Docker Container Guide", "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide", "Welcome to Intel\u00ae Extension for TensorFlow* documentation", "Online Documentation Build Guide", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!", "Contributing guidelines", "Releases", "Directory Tree Structure", "Extension Design", "How to write custom op", "Optimizations Design", "oneDNN object cache optimization", "Frequently Asked Questions", "INT8 Quantization", "OpenXLA", "XPUAutoShard on GPU [Experimental]", "Tune Advanced Auto Mixed Precision", "Advanced Auto Mixed Precision", "Environment Variables", "Features", "GPU Profiler", "Infrastructure", "Graph fusion", "Customized Operators", "Operators Override", "Keras 3 Overview", "Keras Mixed Precision", "Launch Script User Guide", "NextPluggableDevice Overview", "Performance Data", "Practice Guide", "Python APIs", "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*", "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]", "Online Weight Prepack", "<em>Experimental:</em> Intel\u00ae Arc\u2122 A-Series GPU Software Installation", "Conda Environment Installation Instructions", "Overview", "Intel\u00ae Extension for TensorFlow* for C++", "Intel CPU Software Installation", "Intel XPU Software Installation", "Installation Guide", "Examples", "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*", "Common Guide for Running", "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal", "ResNet50 Inference on Intel CPU and GPU", "Intel\u00ae Extension for Tensorflow* Model Quantization API Example", "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU", "Accelerate BERT-Large Pretraining on Intel GPU", "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae", "Quick Example on Intel CPU and GPU", "Stable Diffusion Inference for Text2Image on Intel GPU", "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU", "BERT Training for Classifying Text on Intel CPU and GPU", "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU", "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU", "Refer to train_resnet50", "Accelerate Mask R-CNN Training on Intel GPU", "Resnet50 train on Intel GPU", "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU", "Intel\u00ae Extension for TensorFlow*", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!"], "titleterms": {"1": [0, 11, 31, 34, 37, 40], "1550": 31, "17": 39, "170": 31, "1x": 31, "2": [0, 11, 34, 37, 40], "3": [0, 11, 27, 37], "3d": [31, 55], "4": [0, 11, 31, 37], "4x": 31, "5": 31, "6": 11, "7": 11, "8": 11, "9": 11, "A": 37, "By": 37, "For": [39, 40], "If": 61, "That": 2, "With": 62, "acceler": [45, 50, 51, 55, 60, 62], "access": [2, 32], "accuraci": [31, 54, 57], "activ": 26, "adamw": 26, "adamwithweightdecayoptim": 25, "add": 11, "addit": [31, 39], "advanc": [18, 19, 21, 23, 29, 47, 52], "ai": 31, "alexnet": 45, "all": 29, "alloc": [29, 32], "amp": [19, 21, 47], "api": [17, 18, 20, 21, 23, 33, 47, 48, 49, 54, 62], "appli": [49, 58, 61], "arc": 37, "architectur": [23, 30], "ask": 14, "attribut": [0, 18], "auto": [18, 19, 20, 21], "automat": 47, "automixedprecisionopt": 33, "b0": 31, "b3": 31, "backend": 20, "background": [18, 45, 52], "ban": 0, "bare": [41, 42, 47, 50], "base": [39, 40, 42, 45, 46], "basic": [24, 29], "bazel": [7, 39, 40], "bert": [31, 51, 56, 57], "bf16": 57, "binari": [2, 3, 63], "boost": 52, "build": [2, 3, 5, 11, 14, 28, 34, 39, 40, 41, 42], "c": [7, 34, 40], "cach": 13, "case": 27, "cc": 40, "center": 31, "chang": [8, 51, 54, 55, 57, 60, 61], "channel": 63, "check": [30, 42, 52, 58], "clang": 39, "classifi": [56, 57], "clone": [47, 58], "cnn": 60, "code": [0, 7, 17, 19, 39, 40, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "command": [51, 58, 61, 62], "common": [29, 39, 40, 46], "compar": 47, "compat": 63, "compil": 39, "compressor": 49, "conda": [38, 39, 40], "conduct": 0, "config": [20, 33], "configproto": 33, "configur": [18, 20, 31, 32, 39, 40, 47, 52], "constant": 52, "contain": [2, 3, 41, 42, 47, 50], "content": 32, "contribut": [7, 63], "contributor": 0, "control": 29, "converg": 51, "convolut": 13, "core": 29, "correct": 0, "count": 58, "coven": 0, "cpu": [21, 32, 35, 39, 40, 41, 42, 47, 48, 52, 53, 54, 56, 61, 63], "creat": [5, 39, 40, 58], "current": 30, "custom": [2, 11, 19, 23, 25, 28], "data": [19, 24, 31], "dataset": [49, 51, 55, 60, 61], "debug": 7, "debugopt": 33, "deep": [50, 52], "default": 29, "defin": 11, "definit": 20, "dens": 26, "depend": 58, "deprec": 42, "descript": [2, 3], "design": [10, 12, 29], "detail": 24, "devcloud": [45, 52], "develop": 7, "devic": [30, 58], "differ": [18, 27, 28], "diffus": [31, 54], "directli": 37, "directori": 9, "disabl": 52, "distribut": 58, "docker": [2, 3, 34, 41, 42, 47, 50], "dockerfil": [34, 41, 42], "dockerhub": [41, 42], "document": [4, 5, 6, 7, 63, 64], "download": [39, 40, 47, 56, 58], "driver": [37, 39, 40, 42, 46], "dtype": 28, "dump": 17, "eas": 21, "effect": 36, "efficientnet": 31, "eigen": 35, "enabl": [19, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "end": 18, "enforc": 0, "engin": 23, "environ": [18, 20, 29, 33, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "error": 27, "exampl": [16, 17, 18, 19, 22, 29, 35, 39, 40, 44, 48, 49, 51, 53, 54, 55, 57, 58, 60, 61, 62], "execut": [29, 45, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "experiment": [17, 21, 35, 37], "extens": [2, 3, 4, 6, 7, 10, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "extra": [39, 40], "extract": 40, "faq": [22, 47, 48, 51, 54, 55, 56, 57, 60], "featur": [19, 21, 23], "file": 40, "fine": 57, "finetun": 51, "fit": 28, "flex": 31, "fold": 52, "format": 32, "fp16": 54, "fp32": [47, 54], "fp8": 57, "frequent": 14, "from": [2, 14, 34, 40, 41, 42], "full": 37, "function": 52, "further": 62, "fusion": 24, "gelu": [25, 26], "gener": 24, "get": [41, 42], "get_config": 33, "gnu": 32, "gpu": [2, 17, 21, 22, 31, 32, 37, 39, 40, 42, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62], "gpuoption": 33, "graph": [17, 19, 21, 24, 33, 52], "graphopt": 33, "groupnorm": 25, "guid": [2, 3, 5, 7, 29, 32, 43, 46, 50], "guidelin": [0, 7], "hardwar": [28, 31, 32, 37, 39, 40, 41, 42, 45, 47, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "header": 40, "highlight": 4, "horovod": [55, 58, 61], "how": [11, 16, 28], "hvd": 61, "i": [2, 3, 29], "identifi": 28, "ii": [2, 3, 29], "iii": [2, 29], "imag": [3, 31, 34, 55], "imagenet": 61, "implement": [11, 24], "import": 33, "improv": 18, "incept": [47, 52], "includ": 29, "incompat": 8, "index": 29, "infer": [29, 31, 47, 48, 50, 54], "infrastructur": 23, "instal": [11, 34, 37, 38, 39, 40, 41, 42, 43, 49, 53, 58, 62, 63], "instanc": [26, 29], "instruct": [37, 38], "int8": [15, 21], "integr": 40, "intel": [2, 3, 4, 6, 7, 23, 31, 32, 33, 34, 35, 37, 39, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64], "intel_extension_for_tensorflow": 33, "interfac": 11, "introduct": [5, 13, 23, 45, 47, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "issu": 8, "itex": [25, 33], "itex_verbos": 20, "itexlstm": 25, "iv": 29, "ix": 29, "jemalloc": 29, "jupyt": [52, 54, 56], "kera": [27, 28], "kernel": 11, "known": 8, "lamboptim": 25, "larg": [31, 51, 57], "latenc": 29, "latest": 5, "launch": 29, "launcher": 21, "layer": 26, "layernorm": 25, "layout": [24, 32], "lead": 27, "learn": [50, 52], "level": 20, "librari": [34, 40], "licens": [52, 63], "limit": 36, "linker": 40, "linux": 37, "list": 18, "load": 40, "local": [5, 45, 52], "log": [19, 29], "logic": 29, "loop": 28, "loss": 28, "lstm": 26, "manag": 23, "manual": 19, "mask": [31, 60], "matrix": 52, "max": 31, "medic": [31, 55], "memori": [29, 32], "metal": [41, 42, 47, 50], "method": 47, "mix": [18, 19, 20, 21, 24, 28, 47], "mobilenet": 18, "mode": 29, "model": [28, 31, 34, 47, 49, 50, 51, 54, 55, 57, 60, 61], "multi": [29, 55], "multipl": 29, "name": 33, "nativ": 37, "net": 31, "neural": 49, "nextpluggabledevic": 30, "node": [29, 31], "non": 32, "normal": 26, "note": 53, "notebook": [52, 54, 56], "notic": 19, "numa": [29, 32], "numactl": 32, "number": 29, "numer": 18, "o": 55, "object": [13, 16], "omp_num_thread": 32, "one": 29, "oneapi": [37, 39, 40, 42, 46, 58], "onednn": [13, 52], "onli": [39, 40, 42], "onlin": [5, 36], "op": [11, 25, 33], "openmp": [32, 35], "openxla": [16, 21, 30], "oper": [19, 21, 25, 26, 33], "optim": [12, 13, 19, 21, 24, 58], "option": [20, 37, 39, 40, 58], "origin": 19, "other": 62, "our": 0, "output": [48, 53, 54, 58, 61, 62], "overflow": 28, "overrid": [26, 33], "overview": [15, 16, 17, 19, 20, 27, 28, 29, 30, 31, 32, 33, 36, 39, 49], "packag": [11, 40, 42, 62], "paramet": [61, 62], "patch": [58, 61], "perform": [18, 27, 31, 47], "perman": 0, "phase2": 31, "physic": 29, "pjrt": 30, "platform": 42, "pledg": 0, "pluggabledevic": 30, "plugin": 30, "polici": [1, 28], "pool": 35, "practic": 32, "pre": 49, "precis": [18, 19, 20, 21, 28, 47], "precondit": 38, "prepack": 36, "prepar": [2, 3, 40, 44, 46, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "prerequisit": [11, 33, 48, 51, 54, 55, 56, 57, 60, 61, 62], "preserv": 33, "pretrain": [47, 51], "product": 31, "profil": [21, 22], "protocol": [20, 33], "public": 23, "py": 53, "pypi": [37, 39, 41, 42], "python": [7, 11, 17, 18, 20, 21, 33, 40, 47, 48, 54, 62], "pythonpath": 62, "quantiz": [15, 21, 45, 49, 52], "question": 14, "quick": [19, 50, 53], "quick_exampl": 53, "r": 60, "rcnn": 31, "recommend": 40, "refer": [16, 36, 59], "regist": 11, "releas": [5, 8, 37], "repo": 58, "report": 1, "repositori": 47, "requir": [37, 39, 40, 41, 42, 47, 51, 54, 55, 56, 57, 60, 61, 62, 63], "resnet50": [48, 61, 62], "resnet50v1": 31, "resourc": [10, 63], "respons": 0, "result": [31, 47, 51], "rule": 18, "run": [2, 3, 34, 37, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "runtim": [14, 30], "sampl": 34, "save": 19, "scale": 28, "scope": 0, "script": [2, 29, 46], "secur": [1, 63], "segment": 55, "select": 35, "seri": 37, "serv": [3, 21, 34], "server": [34, 45, 52], "set": [28, 29, 45, 49, 61, 62], "set_config": 33, "setup": [19, 28, 37, 42, 46, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "shard": 62, "shardingconfig": 33, "singl": [29, 55], "situat": 27, "skip": [47, 48, 54, 56, 61], "softwar": [31, 32, 37, 41, 42, 49, 63], "sourc": [14, 34, 39, 40], "speed": 47, "stabil": 18, "stabl": [31, 54], "standard": 0, "start": [30, 50], "startup": [52, 56], "step": [37, 38, 47, 48, 54, 56, 61], "stock": [18, 19], "structur": [9, 17], "style": 7, "subsystem": 37, "support": [21, 63], "switch": 30, "system": [37, 41, 42], "tabl": [32, 63], "tcmalloc": [29, 32], "temporari": 0, "tensorflow": [2, 3, 4, 6, 7, 18, 19, 21, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "test": [5, 7, 47], "text": [56, 57], "text2imag": 54, "tf_num_interop_thread": 29, "tf_num_intraop_thread": 29, "thi": [47, 48, 54, 56, 61], "thread": 35, "throughput": 29, "tile": 55, "tip": [7, 19], "toolkit": [39, 40, 42, 46], "train": [19, 28, 31, 49, 50, 55, 56, 58, 60, 61, 62], "train_resnet50": 59, "tree": 9, "troubleshoot": 14, "tune": [18, 19, 57], "type": [19, 24, 28, 30], "u": 31, "ubuntu": 37, "underflow": 28, "unet": 55, "uniform": 32, "unit": 7, "up": [45, 47, 49], "updat": 5, "us": [11, 21, 27, 29, 30, 34, 35, 61], "usag": [2, 15, 17, 18, 19, 22, 26, 29, 36], "user": 29, "v": [19, 29], "v1": 31, "v3": 52, "v4": 47, "variabl": [18, 20, 29, 33, 37, 42, 47], "vasriabl": 54, "verifi": [2, 11, 37, 41, 42], "version": [5, 33, 52], "vi": 29, "via": [20, 37, 41, 42, 47], "vii": 29, "viii": 29, "virtual": [37, 41, 42, 46, 58], "vulner": 1, "w": 55, "warn": [0, 27], "weekli": 63, "weight": 36, "welcom": [4, 6, 64], "wheel": [37, 41, 42], "why": 30, "window": 37, "without": [61, 62], "work": 16, "workflow": [10, 15, 17, 36], "workload": [31, 50], "write": 11, "wsl2": 37, "x": 29, "xeon": 52, "xla": 30, "xpu": [23, 39, 40, 42, 63], "xpuautoshard": [17, 21, 62], "your": 29, "zoo": 50}})
\ No newline at end of file
+Search.setIndex({"alltitles": {"1.  Prerequisite": [[11, "prerequisite"]], "1. Build Intel\u00ae Extension for TensorFlow* C++ library": [[34, "build-intel-extension-for-tensorflow-c-library"]], "1. Correction": [[0, "correction"]], "1. Install GPU Drivers": [[37, "install-gpu-drivers"]], "2.  Define the op interface and Register op": [[11, "define-the-op-interface-and-register-op"]], "2. Build TensorFlow Serving": [[34, "build-tensorflow-serving"]], "2. Install TensorFlow* via PyPI Wheel in Linux": [[37, "install-tensorflow-via-pypi-wheel-in-linux"]], "2. Warning": [[0, "warning"]], "3.  Register the kernels for the op": [[11, "register-the-kernels-for-the-op"]], "3. Install Intel\u00ae Extension for TensorFlow*": [[37, "install-intel-extension-for-tensorflow"]], "3. Temporary Ban": [[0, "temporary-ban"]], "4.  Implement the kernels": [[11, "implement-the-kernels"]], "4. Permanent Ban": [[0, "permanent-ban"]], "4. Verify the Installation": [[37, "verify-the-installation"]], "6.  Add the op to BUILD": [[11, "add-the-op-to-build"]], "7. Use the op in Python": [[11, "use-the-op-in-python"]], "8. Build the package": [[11, "build-the-package"]], "9.  Install and Verify": [[11, "install-and-verify"]], "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU": [[55, "accelerate-3d-unet-training-w-o-horovod-for-medical-image-segmentation-on-intel-gpu"]], "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*": [[45, "accelerate-alexnet-by-quantization-with-intel-extension-for-tensorflow"]], "Accelerate BERT-Large Pretraining on Intel GPU": [[51, "accelerate-bert-large-pretraining-on-intel-gpu"]], "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU": [[50, "accelerate-deep-learning-training-and-inference-for-model-zoo-workloads-on-intel-gpu"]], "Accelerate Mask R-CNN Training on Intel GPU": [[60, "accelerate-mask-r-cnn-training-on-intel-gpu"]], "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU": [[62, "accelerate-resnet50-training-by-xpuautoshard-on-intel-gpu"]], "Accuracy": [[54, "accuracy"], [57, "accuracy"]], "AdamW": [[26, "adamw"]], "Additional": [[39, "additional"]], "Additional Performance Data for Intel AI Data Center Products": [[31, "additional-performance-data-for-intel-ai-data-center-products"]], "Advanced AMP vs. Stock TensorFlow AMP": [[19, "advanced-amp-vs-stock-tensorflow-amp"]], "Advanced Auto Mixed Precision": [[19, "advanced-auto-mixed-precision"], [19, "id1"]], "Advanced Auto Mixed Precision (AMP)": [[21, "advanced-auto-mixed-precision-amp"]], "Advanced Settings": [[29, "advanced-settings"]], "Advanced: Enable Advanced AMP Method": [[47, "advanced-enable-advanced-amp-method"]], "Apply Model Quantization": [[49, "apply-model-quantization"]], "Apply Patch": [[61, "apply-patch"]], "Apply Patch for Intel GPU": [[58, "apply-patch-for-intel-gpu"]], "Architecture": [[23, "architecture"]], "Attribution": [[0, "attribution"]], "Auto Mixed Precision Options": [[20, "auto-mixed-precision-options"]], "BERT Training for Classifying Text on Intel CPU and GPU": [[56, "bert-training-for-classifying-text-on-intel-cpu-and-gpu"]], "BERT-Large Phase2 Training Performance Results": [[31, "bert-large-phase2-training-performance-results"]], "BF16 + FP8 Fine-tuning": [[57, "bf16-fp8-fine-tuning"]], "Backend and Config Protocol": [[20, "backend-and-config-protocol"]], "Background": [[18, "background"], [45, "background"], [52, "background"]], "Basic Settings": [[29, "basic-settings"]], "Basic fusion": [[24, "basic-fusion"]], "Binaries Preparation": [[2, "binaries-preparation"]], "Build Docker container from Dockerfile": [[41, "build-docker-container-from-dockerfile"], [42, "build-docker-container-from-dockerfile"]], "Build Docker image from Dockerfile": [[34, "build-docker-image-from-dockerfile"]], "Build Intel\u00ae Extension for TensorFlow* CC library": [[40, "build-intel-extension-for-tensorflow-cc-library"]], "Build Intel\u00ae Extension for TensorFlow* PyPI": [[39, "build-intel-extension-for-tensorflow-pypi"]], "Build Source Code": [[39, "build-source-code"], [40, "build-source-code"]], "Build and run": [[40, "build-and-run"]], "Build from source": [[14, "build-from-source"], [34, "build-from-source"]], "Build the Docker Image": [[3, "build-the-docker-image"]], "Build to Local Test": [[5, "build-to-local-test"]], "Building the model": [[28, "building-the-model"]], "C++ coding style": [[7, "c-coding-style"]], "CPU": [[52, "cpu"]], "CPU Launcher [Experimental]": [[21, "cpu-launcher-experimental"]], "CPU Practice Guide": [[32, "cpu-practice-guide"]], "Check Currently Used Device Type": [[30, "check-currently-used-device-type"]], "Check Device Count (Optional)": [[58, "check-device-count-optional"]], "Check Intel\u00ae Advanced Matrix Extensions": [[52, "check-intel-advanced-matrix-extensions"]], "Check Intel\u00ae Deep Learning Boost": [[52, "check-intel-deep-learning-boost"]], "Check the Environment for XPU": [[42, "check-the-environment-for-xpu"]], "Clone Horovod Repo": [[58, "clone-horovod-repo"]], "Clone the Repository": [[47, "clone-the-repository"]], "Code": [[53, "code"]], "Code Structure": [[17, "code-structure"]], "Code style guide": [[7, "code-style-guide"]], "Command": [[61, "command"]], "Command with Horovod": [[61, "command-with-horovod"]], "Commands": [[51, "commands"]], "Common Execution Mode": [[29, "common-execution-mode"]], "Common Guide for Running": [[46, "common-guide-for-running"]], "Common Requirements": [[39, "common-requirements"], [40, "common-requirements"]], "Compatibility Table": [[63, "compatibility-table"]], "Conda Environment Installation Instructions": [[38, "conda-environment-installation-instructions"]], "Configuration": [[31, "configuration"], [52, "configuration"]], "Configuration List": [[18, "configuration-list"]], "Configuration via Environment Variables": [[20, "configuration-via-environment-variables"]], "Configure": [[39, "configure"], [40, "configure"]], "Configure Example For XPU": [[39, "configure-example-for-xpu"]], "Configure Example for CPU": [[39, "configure-example-for-cpu"]], "Configure For CPU": [[39, "configure-for-cpu"], [40, "configure-for-cpu"]], "Configure For GPU": [[40, "configure-for-gpu"]], "Configure For XPU": [[39, "configure-for-xpu"]], "Contributing": [[63, "contributing"]], "Contributing guidelines": [[7, "contributing-guidelines"]], "Contributing to Intel\u00ae Extension for TensorFlow*": [[7, "contributing-to-intel-extension-for-tensorflow"]], "Contributor Covenant Code of Conduct": [[0, "contributor-covenant-code-of-conduct"]], "Convergence": [[51, "convergence"]], "Create Release Version": [[5, "create-release-version"]], "Create Virtual Environment": [[58, "create-virtual-environment"]], "Create a Conda Environment": [[39, "create-a-conda-environment"], [40, "create-a-conda-environment"]], "Custom API": [[23, "custom-api"]], "Custom Operation": [[19, "custom-operation"]], "Customized Operators": [[25, "customized-operators"]], "Data Type": [[19, "data-type"]], "Default memory allocator": [[29, "default-memory-allocator"]], "Dense Layer": [[26, "dense-layer"]], "Dependency": [[58, "dependency"]], "Description": [[2, "description"], [3, "description"]], "Developing Intel\u00ae Extension for TensorFlow*": [[7, "developing-intel-extension-for-tensorflow"]], "Directory Tree Structure": [[9, "directory-tree-structure"]], "Disable Constant Folding Function": [[52, "disable-constant-folding-function"]], "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU": [[58, "distributed-training-example-with-intel-optimization-for-horovod-on-intel-gpu"]], "Documentation": [[4, "documentation"], [63, "documentation"]], "Documentation style guide": [[7, "documentation-style-guide"]], "Download Jupyter Code:": [[56, "download-jupyter-code"]], "Download Patch": [[58, "download-patch"]], "Download Source Code": [[39, "download-source-code"], [40, "download-source-code"]], "Download the Pretrained-model": [[47, "download-the-pretrained-model"]], "Dump the graph": [[17, "dump-the-graph"]], "Ease-of-use Python API": [[21, "ease-of-use-python-api"]], "EfficientNet-B0 Inference Performance Results": [[31, "efficientnet-b0-inference-performance-results"]], "EfficientNet-B3 Inference Performance Results": [[31, "efficientnet-b3-inference-performance-results"]], "Enable Advanced AMP": [[19, "enable-advanced-amp"]], "Enable Running Environment": [[47, "enable-running-environment"], [48, "enable-running-environment"], [51, "enable-running-environment"], [54, "enable-running-environment"], [55, "enable-running-environment"], [56, "enable-running-environment"], [57, "enable-running-environment"], [60, "enable-running-environment"], [61, "enable-running-environment"], [62, "enable-running-environment"]], "Enable Virtual Running Environment": [[46, "enable-virtual-running-environment"]], "Enable oneAPI": [[58, "enable-oneapi"]], "Enable oneAPI Running Environment": [[46, "enable-oneapi-running-environment"]], "Enable oneDNN Graph": [[52, "enable-onednn-graph"]], "End-to-end Example": [[18, "end-to-end-example"]], "Enforcement": [[0, "enforcement"]], "Enforcement Guidelines": [[0, "enforcement-guidelines"]], "Enforcement Responsibilities": [[0, "enforcement-responsibilities"]], "Environment Variable Configuration": [[47, "environment-variable-configuration"]], "Environment Variable Difference with Stock TensorFlow": [[18, "environment-variable-difference-with-stock-tensorflow"]], "Environment Variables": [[20, "environment-variables"], [29, "environment-variables"]], "Environment Variables with Python APIs": [[20, "environment-variables-with-python-apis"]], "Environment Vasriable": [[54, "environment-vasriable"]], "Example": [[16, "example"], [18, "example"], [19, "example"], [35, "example"], [40, "example"]], "Example Output": [[48, "example-output"], [53, "example-output"], [54, "example-output"], [62, "example-output"]], "Example Output with hvd": [[61, "example-output-with-hvd"]], "Example Output without hvd": [[61, "example-output-without-hvd"]], "Example of Mix Precision by List": [[18, "example-of-mix-precision-by-list"]], "Example:": [[22, "example"]], "Examples": [[17, "examples"], [29, "examples"], [44, "examples"], [44, "id1"]], "Execute": [[45, "execute"], [56, "execute"]], "Execute Testing and Comparing the Performance of FP32 and Advanced AMP on CPU and GPU in Docker Container or Bare Metal": [[47, "execute-testing-and-comparing-the-performance-of-fp32-and-advanced-amp-on-cpu-and-gpu-in-docker-container-or-bare-metal"]], "Execute the Example": [[51, "execute-the-example"], [55, "execute-the-example"], [57, "execute-the-example"], [60, "execute-the-example"]], "Executes the Example with Python API": [[48, "executes-the-example-with-python-api"], [54, "executes-the-example-with-python-api"], [62, "executes-the-example-with-python-api"]], "Executing Command": [[62, "executing-command"]], "Execution": [[58, "execution"], [61, "execution"]], "Experimental Release": [[37, "experimental-release"]], "Experimental: Intel\u00ae Arc\u2122 A-Series GPU Software Installation": [[37, "experimental-intel-arc-a-series-gpu-software-installation"]], "Extension Design": [[10, "extension-design"]], "Extra Requirements for XPU Build Only": [[39, "extra-requirements-for-xpu-build-only"]], "Extra Requirements for XPU/GPU Build Only": [[40, "extra-requirements-for-xpu-gpu-build-only"]], "FAQ": [[22, "faq"], [47, "faq"], [48, "faq"], [51, "faq"], [54, "faq"], [55, "faq"], [56, "faq"], [57, "faq"], [60, "faq"]], "FP16 Inference": [[54, "fp16-inference"]], "FP32 Inference": [[54, "fp32-inference"]], "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU": [[57, "fp8-bert-large-fine-tuning-for-classifying-text-on-intel-gpu"]], "Feature": [[19, "feature"]], "Features": [[21, "features"]], "Finetune Command": [[51, "finetune-command"]], "Frequently Asked Questions": [[14, "frequently-asked-questions"]], "Further Settings": [[62, "further-settings"]], "GNU OpenMP": [[32, "gnu-openmp"]], "GPU": [[45, "gpu"], [52, "gpu"]], "GPU Practice Guide": [[32, "gpu-practice-guide"]], "GPU Profiler": [[21, "gpu-profiler"], [22, "gpu-profiler"]], "Gelu Activation": [[26, "gelu-activation"]], "Generic layout optimizer": [[24, "generic-layout-optimizer"]], "Get docker container from dockerhub": [[41, "get-docker-container-from-dockerhub"], [42, "get-docker-container-from-dockerhub"]], "Graph Optimization": [[21, "graph-optimization"]], "Graph Optimizer": [[19, "graph-optimizer"]], "Graph fusion": [[24, "graph-fusion"]], "Hardware Configuration": [[31, "hardware-configuration"], [32, "hardware-configuration"]], "Hardware Configuration for Intel Flex 170 GPU": [[31, "hardware-configuration-for-intel-flex-170-gpu"]], "Hardware Configuration for Intel Max 1550 GPU": [[31, "hardware-configuration-for-intel-max-1550-gpu"]], "Hardware Environment": [[45, "hardware-environment"], [52, "hardware-environment"]], "Hardware Requirement": [[47, "hardware-requirement"], [63, "hardware-requirement"]], "Hardware Requirements": [[37, "hardware-requirements"], [39, "hardware-requirements"], [40, "hardware-requirements"], [41, "hardware-requirements"], [42, "hardware-requirements"], [51, "hardware-requirements"], [54, "hardware-requirements"], [55, "hardware-requirements"], [56, "hardware-requirements"], [57, "hardware-requirements"], [60, "hardware-requirements"], [61, "hardware-requirements"], [62, "hardware-requirements"]], "Highlights": [[4, "highlights"]], "How it works": [[16, "how-it-works"]], "How to identify different hardware types?": [[28, "how-to-identify-different-hardware-types"]], "How to write custom op": [[11, "how-to-write-custom-op"]], "I. Binaries Preparation": [[3, "i-binaries-preparation"]], "I. Customize Build Script": [[2, "i-customize-build-script"]], "I. Use all physical cores": [[29, "i-use-all-physical-cores"]], "II. Build the Container": [[2, "ii-build-the-container"], [3, "ii-build-the-container"]], "II. Use all cores including logical cores": [[29, "ii-use-all-cores-including-logical-cores"]], "III. Running the Container": [[2, "iii-running-the-container"]], "III. Use physical cores on one node": [[29, "iii-use-physical-cores-on-one-node"]], "INT8 Quantization": [[15, "int8-quantization"], [21, "int8-quantization"]], "ITEX_VERBOSE level definition": [[20, "itex-verbose-level-definition"]], "IV. Use your designated number of cores": [[29, "iv-use-your-designated-number-of-cores"]], "IX. Set environment variable TF_NUM_INTRAOP_THREADS": [[29, "ix-set-environment-variable-tf-num-intraop-threads"]], "If not use Horovod": [[61, "if-not-use-horovod"]], "If use Horovod": [[61, "if-use-horovod"]], "Implementation Details": [[24, "implementation-details"]], "Incompatible Changes": [[8, "incompatible-changes"]], "Inference Performance Results": [[31, "inference-performance-results"]], "Inference Performance on 1x Intel Data Center GPU Flex 170": [[31, "inference-performance-on-1x-intel-data-center-gpu-flex-170"]], "Inference Workloads": [[31, "inference-workloads"]], "Infrastructure": [[23, "infrastructure"]], "Install": [[58, "install"], [63, "install"]], "Install Bazel": [[39, "install-bazel"], [40, "install-bazel"]], "Install Clang-17 compiler": [[39, "install-clang-17-compiler"]], "Install GPU Drivers": [[42, "install-gpu-drivers"]], "Install Intel GPU Driver": [[39, "install-intel-gpu-driver"], [40, "install-intel-gpu-driver"]], "Install Intel\u00ae Extension for TensorFlow*": [[41, "install-intel-extension-for-tensorflow"], [42, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Extension for Tensorflow*": [[49, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Neural Compressor": [[49, "install-intel-neural-compressor"]], "Install Model Server": [[34, "install-model-server"]], "Install Other Required Packages": [[62, "install-other-required-packages"]], "Install TensorFlow": [[37, "install-tensorflow"], [39, "install-tensorflow"], [40, "install-tensorflow"], [41, "install-tensorflow"], [42, "install-tensorflow"]], "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*": [[34, "install-tensorflow-serving-with-intel-extension-for-tensorflow"]], "Install for CPU": [[63, "install-for-cpu"]], "Install for CPU weekly": [[63, "install-for-cpu-weekly"]], "Install for XPU": [[63, "install-for-xpu"]], "Install for XPU weekly": [[63, "install-for-xpu-weekly"]], "Install for weekly binaries": [[63, "install-for-weekly-binaries"]], "Install oneAPI Base Toolkit": [[39, "install-oneapi-base-toolkit"], [40, "install-oneapi-base-toolkit"]], "Install oneAPI Base Toolkit Packages": [[42, "install-oneapi-base-toolkit-packages"]], "Install using Docker": [[34, "install-using-docker"]], "Install via Docker container": [[41, "install-via-docker-container"], [42, "install-via-docker-container"]], "Install via PyPI wheel in bare metal": [[41, "install-via-pypi-wheel-in-bare-metal"], [42, "install-via-pypi-wheel-in-bare-metal"]], "Installation": [[53, "installation"]], "Installation Channel:": [[63, "installation-channel"]], "Installation Guide": [[43, "installation-guide"]], "Instance Normalization": [[26, "instance-normalization"]], "Integrate the CC library": [[40, "integrate-the-cc-library"]], "Intel Advanced Feature and Extension Management": [[23, "intel-advanced-feature-and-extension-management"]], "Intel CPU Software Installation": [[41, "intel-cpu-software-installation"]], "Intel GPU Driver": [[46, "intel-gpu-driver"]], "Intel OpenMP": [[32, "intel-openmp"]], "Intel XPU Software Installation": [[42, "intel-xpu-software-installation"]], "Intel\u00ae DevCloud": [[45, "intel-devcloud"], [52, "intel-devcloud"]], "Intel\u00ae Extension for TensorFlow*": [[63, "intel-extension-for-tensorflow"]], "Intel\u00ae Extension for TensorFlow* Config Protocol": [[33, "intel-extension-for-tensorflow-config-protocol"]], "Intel\u00ae Extension for TensorFlow* Docker Container Guide": [[2, "intel-extension-for-tensorflow-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide": [[3, "intel-extension-for-tensorflow-serving-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* for C++": [[40, "intel-extension-for-tensorflow-for-c"]], "Intel\u00ae Extension for Tensorflow* Model Quantization API Example": [[49, "intel-extension-for-tensorflow-model-quantization-api-example"]], "Intel\u00ae Extension for Tensorflow* Version": [[52, "intel-extension-for-tensorflow-version"]], "Intel\u00ae oneAPI Base Toolkit": [[46, "intel-oneapi-base-toolkit"]], "Introduction": [[5, "introduction"], [13, "introduction"], [23, "introduction"], [45, "introduction"], [47, "introduction"], [50, "introduction"], [51, "introduction"], [52, "introduction"], [54, "introduction"], [55, "introduction"], [56, "introduction"], [57, "introduction"], [60, "introduction"], [61, "introduction"], [62, "introduction"]], "Jemalloc": [[29, "jemalloc"]], "Keras 3 Overview": [[27, "keras-3-overview"]], "Keras Mixed Precision": [[28, "keras-mixed-precision"]], "Known Issues": [[8, "known-issues"]], "LSTM": [[26, "lstm"]], "Latency mode": [[29, "latency-mode"]], "Launch Log": [[29, "launch-log"]], "Launch Script User Guide": [[29, "launch-script-user-guide"]], "Layer Normalization": [[26, "layer-normalization"]], "License": [[52, "license"], [63, "license"]], "Limitation": [[36, "limitation"]], "Linker": [[40, "linker"]], "Load": [[40, "load"]], "Local Server": [[45, "local-server"], [52, "local-server"]], "Log and Save Optimized Graph": [[19, "log-and-save-optimized-graph"]], "Loss scaling": [[28, "loss-scaling"]], "Loss scaling overview": [[28, "loss-scaling-overview"]], "Mask-RCNN Inference Performance Results": [[31, "mask-rcnn-inference-performance-results"]], "Mask-RCNN Training Performance Results": [[31, "mask-rcnn-training-performance-results"]], "Medical Image 3D U-Net Training Performance Results": [[31, "medical-image-3d-u-net-training-performance-results"]], "Memory Allocator": [[29, "memory-allocator"], [32, "memory-allocator"]], "Memory Layout format": [[32, "memory-layout-format"]], "Mixed data type fusion": [[24, "mixed-data-type-fusion"]], "Model Code change": [[51, "model-code-change"], [54, "model-code-change"], [55, "model-code-change"], [57, "model-code-change"], [60, "model-code-change"], [61, "model-code-change"]], "Models": [[31, "models"]], "Multi-instance": [[29, "multi-instance"]], "Multi-tile with horovod": [[55, "multi-tile-with-horovod"]], "Multiple instances for inference": [[29, "multiple-instances-for-inference"]], "NUMA Control": [[29, "numa-control"]], "Native Linux Running Directly on Hardware": [[37, "native-linux-running-directly-on-hardware"], [37, "id2"]], "NextPluggableDevice Architecture": [[30, "nextpluggabledevice-architecture"]], "NextPluggableDevice Overview": [[30, "nextpluggabledevice-overview"]], "Non-Uniform Memory Access (NUMA)": [[32, "non-uniform-memory-access-numa"]], "Notes": [[53, "notes"]], "Notice": [[19, "notice"]], "Numactl": [[32, "numactl"]], "Numeric Stability": [[18, "numeric-stability"]], "OMP_NUM_THREADS": [[32, "omp-num-threads"]], "Objectives": [[16, "objectives"]], "Online Documentation Build Guide": [[5, "online-documentation-build-guide"]], "Online Weight Prepack": [[36, "online-weight-prepack"]], "OpenMP": [[32, "openmp"]], "OpenXLA": [[16, "openxla"]], "OpenXLA PJRT Plugin": [[30, "openxla-pjrt-plugin"]], "OpenXLA Support on GPU [Experimental]": [[21, "openxla-support-on-gpu-experimental"]], "Operator Optimization": [[21, "operator-optimization"]], "Operators Override": [[26, "operators-override"]], "Optimization in convolution": [[13, "optimization-in-convolution"]], "Optimizations Design": [[12, "optimizations-design"]], "Option 1: Extract from Tensorflow* python package (Recommended)": [[40, "option-1-extract-from-tensorflow-python-package-recommended"]], "Option 2: Build from TensorFlow* source code": [[40, "option-2-build-from-tensorflow-source-code"]], "Optional Requirements for CPU Build Only": [[39, "optional-requirements-for-cpu-build-only"]], "Optional: Install Full Intel\u00ae oneAPI": [[37, "optional-install-full-intel-oneapi"]], "Original Code": [[19, "original-code"]], "Our Pledge": [[0, "our-pledge"]], "Our Standards": [[0, "our-standards"]], "Output": [[58, "output"]], "Overview": [[15, "overview"], [16, "overview"], [17, "overview"], [19, "overview"], [20, "overview"], [28, "overview"], [29, "overview"], [31, "overview"], [32, "overview"], [33, "overview"], [36, "overview"], [39, "overview"], [49, "overview"]], "Performance Data": [[31, "performance-data"]], "Practice Guide": [[32, "practice-guide"]], "Preconditions": [[38, "preconditions"]], "Prepare": [[46, "prepare"]], "Prepare Dataset": [[49, "prepare-dataset"], [51, "prepare-dataset"], [55, "prepare-dataset"], [60, "prepare-dataset"]], "Prepare Example Code": [[58, "prepare-example-code"]], "Prepare ImageNet dataset": [[61, "prepare-imagenet-dataset"]], "Prepare Pre-Trained Model": [[49, "prepare-pre-trained-model"]], "Prepare Tensorflow* CC library and header files": [[40, "prepare-tensorflow-cc-library-and-header-files"]], "Prepare for GPU": [[51, "prepare-for-gpu"], [55, "prepare-for-gpu"], [57, "prepare-for-gpu"], [60, "prepare-for-gpu"], [62, "prepare-for-gpu"]], "Prepare for GPU (Skip this Step for CPU)": [[47, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for GPU (Skip this step for CPU)": [[48, "prepare-for-gpu-skip-this-step-for-cpu"], [54, "prepare-for-gpu-skip-this-step-for-cpu"], [56, "prepare-for-gpu-skip-this-step-for-cpu"], [61, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for Running": [[44, "prepare-for-running"]], "Prepare the Codes": [[62, "prepare-the-codes"]], "Prerequisite: import intel_extension_for_tensorflow as itex": [[33, "prerequisite-import-intel-extension-for-tensorflow-as-itex"]], "Prerequisites": [[48, "prerequisites"], [51, "prerequisites"], [51, "id1"], [51, "id2"], [54, "prerequisites"], [55, "prerequisites"], [56, "prerequisites"], [57, "prerequisites"], [60, "prerequisites"], [61, "prerequisites"], [62, "prerequisites"]], "Pretraining Command": [[51, "pretraining-command"]], "Python API": [[17, "python-api"], [18, "python-api"], [47, "python-api"], [62, "python-api"]], "Python API Attribute & Environment Variable": [[18, "python-api-attribute-environment-variable"]], "Python APIs": [[33, "python-apis"]], "Python APIs and Environment Variable Names": [[33, "python-apis-and-environment-variable-names"]], "Python APIs and preserved environment variable Names": [[33, "python-apis-and-preserved-environment-variable-names"]], "Python Unit Testing": [[7, "python-unit-testing"]], "Python coding style": [[7, "python-coding-style"]], "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae": [[52, "quantize-inception-v3-by-intel-extension-for-tensorflow-on-intel-xeon"]], "Quick Example on Intel CPU and GPU": [[53, "quick-example-on-intel-cpu-and-gpu"]], "Quick Start Guide": [[50, "quick-start-guide"]], "Quick Training Example": [[19, "quick-training-example"]], "Refer to train_resnet50": [[59, "refer-to-train-resnet50"]], "Reference": [[36, "reference"]], "References": [[16, "references"]], "Releases": [[8, "releases"]], "Report a Vulnerability": [[1, "report-a-vulnerability"]], "Requirements": [[39, "requirements"], [40, "requirements"]], "ResNet50 Inference on Intel CPU and GPU": [[48, "resnet50-inference-on-intel-cpu-and-gpu"]], "ResNet50v1-5 Inference Performance Results": [[31, "resnet50v1-5-inference-performance-results"]], "ResNet50v1-5 Training Performance Results": [[31, "resnet50v1-5-training-performance-results"]], "Resnet50 train on Intel GPU": [[61, "resnet50-train-on-intel-gpu"]], "Resources": [[10, "resources"], [63, "resources"]], "Result": [[47, "result"]], "Results": [[51, "results"]], "Rule to Improve Performance by the Configuration List": [[18, "rule-to-improve-performance-by-the-configuration-list"]], "Run Model Quantization Example:": [[49, "run-model-quantization-example"]], "Run Models in the Docker Container": [[50, "run-models-in-the-docker-container"]], "Run Models on Bare Metal": [[50, "run-models-on-bare-metal"]], "Run Script": [[46, "run-script"]], "Run sample": [[34, "run-sample"]], "Running": [[46, "running"]], "Running Command": [[58, "running-command"]], "Running Environment": [[45, "running-environment"], [52, "running-environment"]], "Running the Container": [[3, "running-the-container"]], "Running the Jupyter Notebook": [[54, "running-the-jupyter-notebook"]], "Runtime": [[14, "runtime"]], "Runtime Switch of NextPluggableDevice and PluggableDevice": [[30, "runtime-switch-of-nextpluggabledevice-and-pluggabledevice"]], "Scope": [[0, "scope"]], "Security": [[63, "security"]], "Security Policy": [[1, "security-policy"]], "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]": [[35, "selecting-thread-pool-in-intel-extension-for-tensorflow-cpu-experimental"]], "Set Model Parameters": [[61, "set-model-parameters"]], "Set Up Software Environment": [[49, "set-up-software-environment"]], "Set environment variables for inference": [[29, "set-environment-variables-for-inference"]], "Set up Base Running Environment": [[45, "set-up-base-running-environment"]], "Set up Intel\u00ae Extension for Tensorflow* for GPU": [[45, "set-up-intel-extension-for-tensorflow-for-gpu"]], "Setting the dtype policy": [[28, "setting-the-dtype-policy"]], "Setup": [[19, "setup"], [28, "setup"]], "Setup PYTHONPATH": [[62, "setup-pythonpath"]], "Setup Running Environment": [[46, "setup-running-environment"], [47, "setup-running-environment"], [48, "setup-running-environment"], [51, "setup-running-environment"], [54, "setup-running-environment"], [55, "setup-running-environment"], [56, "setup-running-environment"], [57, "setup-running-environment"], [58, "setup-running-environment"], [60, "setup-running-environment"], [61, "setup-running-environment"]], "Setup environment variables": [[37, "setup-environment-variables"], [42, "setup-environment-variables"]], "Sharding Parameters Setting": [[62, "sharding-parameters-setting"]], "Single Tile": [[55, "single-tile"]], "Single instance for inference": [[29, "single-instance-for-inference"]], "Situations leads to warning or Error": [[27, "situations-leads-to-warning-or-error"]], "Software Configuration": [[31, "software-configuration"], [32, "software-configuration"]], "Software Configuration for Intel Flex 170 GPU": [[31, "software-configuration-for-intel-flex-170-gpu"]], "Software Configuration for Intel Max 1550 GPU": [[31, "software-configuration-for-intel-max-1550-gpu"]], "Software Requirement": [[63, "software-requirement"]], "Software Requirements": [[37, "software-requirements"], [41, "software-requirements"], [42, "software-requirements"]], "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal": [[47, "speed-up-inference-of-inception-v4-by-advanced-automatic-mixed-precision-on-intel-cpu-and-gpu-via-docker-container-or-bare-metal"]], "Stable Diffusion Inference for Text2Image on Intel GPU": [[54, "stable-diffusion-inference-for-text2image-on-intel-gpu"]], "Stable Diffusion v1-4 Inference Performance Results": [[31, "stable-diffusion-v1-4-inference-performance-results"]], "Start with XLA using NextPluggableDevice": [[30, "start-with-xla-using-nextpluggabledevice"]], "Startup Jupyter Notebook": [[52, "startup-jupyter-notebook"], [56, "startup-jupyter-notebook"]], "Step": [[47, "step"]], "Step by step instructions:": [[38, "step-by-step-instructions"]], "Step-By-Step Instructions": [[37, "step-by-step-instructions"]], "Support": [[63, "support"]], "System environment install": [[37, "system-environment-install"], [41, "system-environment-install"], [42, "system-environment-install"]], "TCMalloc": [[29, "tcmalloc"], [32, "tcmalloc"]], "Table of Contents": [[32, "table-of-contents"]], "TensorFlow Public API": [[23, "tensorflow-public-api"]], "TensorFlow Serving": [[21, "tensorflow-serving"]], "Throughput mode": [[29, "throughput-mode"]], "Tips": [[19, "tips"]], "Tips and Debugging": [[7, "tips-and-debugging"]], "Training Accuracy Results": [[31, "training-accuracy-results"]], "Training Accuracy on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-accuracy-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Performance Results": [[31, "training-performance-results"]], "Training Performance on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-performance-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Workloads": [[31, "training-workloads"]], "Training the model with Model.fit": [[28, "training-the-model-with-model-fit"]], "Training the model with a custom training loop": [[28, "training-the-model-with-a-custom-training-loop"]], "Troubleshooting": [[14, "troubleshooting"]], "Tune Advanced AMP Manually": [[19, "tune-advanced-amp-manually"]], "Tune Advanced Auto Mixed Precision": [[18, "tune-advanced-auto-mixed-precision"]], "Tuning Performance Example on MobileNet": [[18, "tuning-performance-example-on-mobilenet"]], "Ubuntu Linux Installed in WSL2": [[37, "ubuntu-linux-installed-in-wsl2"]], "Underflow and Overflow": [[28, "underflow-and-overflow"]], "Unit testing": [[7, "unit-testing"]], "Update latest Version": [[5, "update-latest-version"]], "Usage": [[15, "usage"], [17, "usage"], [18, "usage"], [18, "id1"], [19, "usage"], [22, "usage"], [26, "usage"]], "Usage & Effect": [[36, "usage-effect"]], "Usage of Docker Container": [[2, "usage-of-docker-container"]], "Usage of TCMalloc/Jemalloc/Default memory allocator": [[29, "usage-of-tcmalloc-jemalloc-default-memory-allocator"]], "Use Case with different performance": [[27, "use-case-with-different-performance"]], "Using Eigen Thread Pool": [[35, "using-eigen-thread-pool"]], "Using OpenMP Thread Pool": [[35, "using-openmp-thread-pool"]], "V. Throughput mode": [[29, "v-throughput-mode"]], "VI. Latency mode": [[29, "vi-latency-mode"]], "VII. Your designated number of instances": [[29, "vii-your-designated-number-of-instances"]], "VIII. Your designated number of instances and instance index": [[29, "viii-your-designated-number-of-instances-and-instance-index"]], "Verify That Intel GPU is Accessible From TensorFlow": [[2, "verify-that-intel-gpu-is-accessible-from-tensorflow"]], "Verify the Installation": [[41, "verify-the-installation"], [42, "verify-the-installation"]], "Virtual environment install": [[37, "virtual-environment-install"], [41, "virtual-environment-install"], [42, "virtual-environment-install"]], "Welcome to Intel \u00ae Extension for TensorFlow* documentation!": [[6, "welcome-to-intel-extension-for-tensorflow-documentation"], [64, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Welcome to Intel\u00ae Extension for TensorFlow* documentation": [[4, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Why NextPluggableDevice": [[30, "why-nextpluggabledevice"]], "Windows GPU Drivers": [[37, "windows-gpu-drivers"]], "Windows Subsystem for Linux 2 (WSL2)": [[37, "windows-subsystem-for-linux-2-wsl2"], [37, "id1"]], "With XPUAutoShard": [[62, "with-xpuautoshard"]], "Without XPUAutoShard": [[62, "without-xpuautoshard"]], "Workflow": [[10, "workflow"], [15, "workflow"], [17, "workflow"], [36, "workflow"]], "X. Set environment variable TF_NUM_INTEROP_THREADS": [[29, "x-set-environment-variable-tf-num-interop-threads"]], "XPU Engine": [[23, "xpu-engine"]], "XPU for CPU only platform (Deprecated)": [[42, "xpu-for-cpu-only-platform-deprecated"]], "XPUAutoShard on GPU [Experimental]": [[17, "xpuautoshard-on-gpu-experimental"], [21, "xpuautoshard-on-gpu-experimental"]], "bazel style guide": [[7, "bazel-style-guide"]], "itex graph": [[33, "itex-graph"]], "itex operators": [[33, "itex-operators"]], "itex ops override": [[33, "itex-ops-override"]], "itex version": [[33, "itex-version"]], "itex.AutoMixedPrecisionOptions": [[33, "itex-automixedprecisionoptions"]], "itex.ConfigProto": [[33, "itex-configproto"]], "itex.DebugOptions": [[33, "itex-debugoptions"]], "itex.GPUOptions": [[33, "itex-gpuoptions"]], "itex.GraphOptions": [[33, "itex-graphoptions"]], "itex.ShardingConfig": [[33, "itex-shardingconfig"]], "itex.get_config": [[33, "itex-get-config"]], "itex.ops.AdamWithWeightDecayOptimizer": [[25, "itex-ops-adamwithweightdecayoptimizer"]], "itex.ops.GroupNormalization": [[25, "itex-ops-groupnormalization"]], "itex.ops.ItexLSTM": [[25, "itex-ops-itexlstm"]], "itex.ops.LAMBOptimizer": [[25, "itex-ops-lamboptimizer"]], "itex.ops.LayerNormalization": [[25, "itex-ops-layernormalization"]], "itex.ops.gelu": [[25, "itex-ops-gelu"]], "itex.set_config": [[33, "itex-set-config"]], "oneDNN object cache optimization": [[13, "onednn-object-cache-optimization"]], "quick_example.py": [[53, "quick-example-py"]]}, "docnames": ["CODE_OF_CONDUCT", "SECURITY", "docker/README", "docker/tensorflow-serving/README", "docs/README", "docs/build_docs/docs_build_tips", "docs/build_docs/source/index", "docs/community/contributing", "docs/community/releases", "docs/design/directory_structure", "docs/design/extension_design", "docs/design/how_to_write_custom_op", "docs/design/optimization/README", "docs/design/optimization/oneDNN_object_cache", "docs/guide/FAQ", "docs/guide/INT8_quantization", "docs/guide/OpenXLA", "docs/guide/XPUAutoShard", "docs/guide/aamp_tune", "docs/guide/advanced_auto_mixed_precision", "docs/guide/environment_variables", "docs/guide/features", "docs/guide/how_to_enable_profiler", "docs/guide/infrastructure", "docs/guide/itex_fusion", "docs/guide/itex_ops", "docs/guide/itex_ops_override", "docs/guide/keras3_support", "docs/guide/keras_mixed_precision", "docs/guide/launch", "docs/guide/next_pluggable_device", "docs/guide/performance", "docs/guide/practice_guide", "docs/guide/python_api", "docs/guide/tf_serving_install", "docs/guide/threadpool", "docs/guide/weight_prepack", "docs/install/experimental/install_for_arc_gpu", "docs/install/experimental/install_for_gpu_conda", "docs/install/how_to_build", "docs/install/install_for_cpp", "docs/install/install_for_cpu", "docs/install/install_for_xpu", "docs/install/installation_guide", "examples/README", "examples/accelerate_alexnet_by_quantization/README", "examples/common_guide_running", "examples/infer_inception_v4_amp/README", "examples/infer_resnet50/README", "examples/itex_quantization_example/README", "examples/model_zoo_example/README", "examples/pretrain_bert/README", "examples/quantize_inception_v3/README", "examples/quick_example", "examples/stable_diffussion_inference/README", "examples/train_3d_unet/README", "examples/train_bert/README", "examples/train_bert_fp8/README", "examples/train_horovod/mnist/README", "examples/train_horovod/resnet50/README", "examples/train_maskrcnn/README", "examples/train_resnet50/README", "examples/train_resnet50_with_autoshard/README", "get_started", "index"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["CODE_OF_CONDUCT.md", "SECURITY.md", "docker/README.md", "docker/tensorflow-serving/README.md", "docs/README.md", "docs/build_docs/docs_build_tips.md", "docs/build_docs/source/index.rst", "docs/community/contributing.md", "docs/community/releases.md", "docs/design/directory_structure.md", "docs/design/extension_design.md", "docs/design/how_to_write_custom_op.md", "docs/design/optimization/README.md", "docs/design/optimization/oneDNN_object_cache.md", "docs/guide/FAQ.md", "docs/guide/INT8_quantization.md", "docs/guide/OpenXLA.md", "docs/guide/XPUAutoShard.md", "docs/guide/aamp_tune.md", "docs/guide/advanced_auto_mixed_precision.md", "docs/guide/environment_variables.md", "docs/guide/features.rst", "docs/guide/how_to_enable_profiler.md", "docs/guide/infrastructure.md", "docs/guide/itex_fusion.md", "docs/guide/itex_ops.md", "docs/guide/itex_ops_override.md", "docs/guide/keras3_support.md", "docs/guide/keras_mixed_precision.md", "docs/guide/launch.md", "docs/guide/next_pluggable_device.md", "docs/guide/performance.md", "docs/guide/practice_guide.md", "docs/guide/python_api.md", "docs/guide/tf_serving_install.md", "docs/guide/threadpool.md", "docs/guide/weight_prepack.md", "docs/install/experimental/install_for_arc_gpu.md", "docs/install/experimental/install_for_gpu_conda.md", "docs/install/how_to_build.md", "docs/install/install_for_cpp.md", "docs/install/install_for_cpu.md", "docs/install/install_for_xpu.md", "docs/install/installation_guide.rst", "examples/README.md", "examples/accelerate_alexnet_by_quantization/README.md", "examples/common_guide_running.md", "examples/infer_inception_v4_amp/README.md", "examples/infer_resnet50/README.md", "examples/itex_quantization_example/README.md", "examples/model_zoo_example/README.md", "examples/pretrain_bert/README.md", "examples/quantize_inception_v3/README.md", "examples/quick_example.md", "examples/stable_diffussion_inference/README.md", "examples/train_3d_unet/README.md", "examples/train_bert/README.md", "examples/train_bert_fp8/README.md", "examples/train_horovod/mnist/README.md", "examples/train_horovod/resnet50/README.md", "examples/train_maskrcnn/README.md", "examples/train_resnet50/README.md", "examples/train_resnet50_with_autoshard/README.md", "get_started.md", "index.rst"], "indexentries": {}, "objects": {}, "objnames": {}, "objtypes": {}, "terms": {"": [0, 4, 5, 14, 16, 18, 20, 21, 28, 31, 32, 34, 35, 39, 40, 45, 47, 49, 51, 52, 54, 55, 56, 63], "0": [2, 3, 4, 5, 11, 14, 15, 16, 19, 20, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 48, 49, 51, 52, 53, 56, 57, 58, 60, 61, 62, 63], "00": [16, 31, 42, 49, 61], "000": 28, "000000e": 51, "0001": 49, "0005": 51, "000611": 51, "001": [25, 26], "00363725": 25, "004": 51, "00404969": 25, "004888": 51, "006297": 61, "006950": 58, "00x": 31, "01": [14, 16, 26, 31, 33, 49, 61], "0113076031208038": 47, "01837550401687622": 47, "02": [16, 26, 28, 31, 61], "025180": 62, "027671": 62, "03": [29, 31, 51, 61], "037595": 51, "04": [2, 16, 31, 34, 35, 37, 39, 41, 42, 49, 56], "05": [16, 29, 31, 58], "0527704": 53, "06": [14, 16, 25, 28, 51], "061277": 28, "061301": 28, "061306": 28, "063685": 28, "063851": 28, "063865": 28, "0656753": 53, "07": [14, 16, 25, 31, 42, 61, 62], "072701": 51, "072752": 51, "072779": 51, "072805": 51, "072829": 51, "072861": 51, "072884": 51, "072928": 51, "073072": 51, "073094": 51, "073121": 51, "073183": 51, "077278": 53, "08": [16, 29, 35, 61], "089": 29, "09": [16, 29, 61], "090": 29, "0f": 11, "1": [2, 4, 5, 14, 16, 18, 19, 20, 21, 22, 25, 26, 27, 28, 29, 30, 32, 33, 35, 36, 38, 39, 42, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "10": [2, 14, 16, 18, 19, 25, 28, 29, 35, 36, 37, 39, 40, 41, 49, 51, 52, 61, 62, 63], "100": [11, 28, 33, 39, 51], "1000": [31, 34, 55, 61], "10000": [19, 25, 28], "101": 37, "1024": [28, 31], "1024_a": 51, "1024gb": 31, "103148": 62, "105446": 51, "107809": 58, "10gbase": 31, "11": [16, 18, 29, 31, 37, 38, 39, 40, 42, 61, 63], "111": [28, 32], "112": 32, "114": [28, 58], "1146879196167": 54, "11490434": 28, "116": 14, "118": [28, 30], "118212": 53, "1193419": 53, "12": [7, 14, 16, 28, 29, 31, 42, 51, 54, 56, 58, 61, 62, 63], "1200": 61, "122": 33, "122414": 51, "122509": 51, "12278": 31, "127": [5, 34], "128": [16, 31, 47, 51, 57], "128gb": 31, "129": 29, "12_h": 51, "12e": 51, "13": [16, 40, 52, 58, 62, 63], "133": 49, "136": 29, "137": 29, "139660941027136": 61, "139898862851904": 61, "14": [28, 31, 34, 40, 49, 51, 56, 58, 61, 63], "140": [39, 40], "140348344015936": 62, "1403804": 53, "140612319840064": 61, "141": 11, "144": 29, "1445": 11, "145": [29, 61, 62], "1455178": 53, "15": [2, 7, 16, 29, 31, 35, 37, 38, 39, 40, 41, 42, 45, 51, 63], "150": 55, "15000": 25, "15031084974591766410": 2, "150400": 31, "150w": 31, "1550": 16, "156": 28, "15865526": 25, "158808": 25, "16": [18, 28, 29, 31, 33, 41, 47, 51, 61], "161625": 62, "163": 49, "163161": 58, "163517": 58, "163815": 62, "1657011814330": 18, "1657011815538": 18, "1658201": 53, "1666": 51, "1691980294577": 47, "16x64gb": 31, "17": [29, 40], "170": [39, 40, 42, 54, 57], "1704025": 53, "170intel": 47, "1729176": 53, "174": 56, "17448926295332318308": 2, "1762": 31, "1766": 31, "177216": 51, "178206": 61, "18": [16, 51, 58], "182": 31, "1846": 51, "185w": 31, "19": [29, 31, 37, 41, 42], "1900": 61, "190052": 51, "190136": 51, "190169": 51, "190193": 51, "190217": 51, "190249": 51, "190273": 51, "190343": 51, "190536": 51, "190559": 51, "190587": 51, "190668": 51, "191": 29, "192": [29, 51], "197306": 53, "198": 29, "1986": 28, "1997": 25, "1a": 40, "1ccb4fee": 38, "1e": [25, 26, 28], "1export": [18, 19], "1tb": 31, "1u": 28, "2": [2, 14, 15, 16, 17, 18, 19, 20, 24, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 57, 58, 60, 61, 62, 63], "20": [16, 29, 31, 35, 39, 41, 60, 62], "200": [25, 26, 51], "2000": [51, 61], "200m": 32, "2016": 25, "2017": [31, 60], "2018": 49, "20180905": 33, "2019": 55, "20200711": 49, "2021": 14, "2022": [28, 29, 33], "2023": [38, 42, 49, 51, 58], "20230123": 21, "2024": [14, 31, 37, 42], "206": 29, "207": 29, "21": [29, 31, 51], "210": 49, "2100": 61, "2134862": 53, "215": 29, "2155": 28, "216": 29, "217981": 42, "22": [2, 31, 34, 37, 39, 41, 42, 49, 51, 62], "2200": 61, "22355853": 48, "224": [22, 49], "22471978829632": 51, "224x224": 31, "227250": 51, "229": 29, "23": [29, 31, 42, 62], "2300": 61, "23092487755584": 51, "23450678511424": 51, "2350": 37, "24": [29, 31, 51, 58], "2400": 61, "241": 29, "2488174077578": 57, "24_h": 51, "24x": 31, "25": [31, 62], "250": 58, "250221": 53, "25294047594070435": 28, "254": 29, "255": [19, 28, 35], "256": [28, 31, 35, 51, 62], "26": 35, "2600": 51, "2607155": 53, "2636094": 53, "26531240344047546": 28, "266": 29, "268435456": 2, "269": 28, "27": [16, 29, 32, 62], "272": 30, "27642": 42, "277716": 61, "277811": 61, "278": 29, "28": [29, 31, 32, 38, 42, 49, 51], "280": 62, "29": [29, 31], "290": 29, "298973": 53, "299": 35, "2nd": 41, "2tb": 31, "2x": [31, 35], "2x256x10": 62, "3": [2, 4, 7, 16, 18, 20, 22, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 38, 39, 40, 41, 42, 45, 46, 49, 52, 53, 62], "30": [14, 16, 31, 35, 49, 51, 62], "3000765": 53, "3007": 31, "300x300": [31, 49], "302": 29, "303": 28, "305706": 53, "31": [29, 37], "312": [31, 51], "314010": 51, "314064": 51, "314090": 51, "314113": 51, "314135": 51, "314165": 51, "314197": 51, "314260": 51, "314455": 51, "314478": 51, "314505": 51, "314589": 51, "315": 29, "318963": 53, "32": [16, 18, 25, 26, 28, 29, 31, 33, 47, 51, 57, 61], "3200": 31, "3221133": 53, "3265": 31, "327": 29, "327398": 53, "328223477737884": 54, "33": 14, "3343554": 62, "3359": 28, "3359284": 62, "3364005982875824": 28, "339": 29, "3391027": 53, "34": 29, "3455": 28, "3461": 31, "35": [29, 31, 42], "350w": 31, "351": 29, "3549364": 53, "3555": 28, "3587": 31, "36": [29, 31, 35, 49], "364": 29, "3670": 28, "37": 16, "3753": 28, "376": 29, "3787665": 53, "38": [29, 31], "3804817": 53, "381424": 53, "384": 31, "3870": 31, "388": 29, "39": [29, 31], "3905785": 53, "3999124": 53, "3d": 44, "3dunet_itex": 55, "3dunet_itex_with_horovod": 55, "3e": [51, 57], "3f": 35, "3rd": [4, 21, 31, 41], "4": [14, 17, 18, 20, 24, 25, 28, 29, 30, 32, 35, 38, 51, 53, 58, 60, 62], "40": [14, 16, 29, 31, 42, 51], "400": [29, 61], "404": 29, "405": 29, "408512": 61, "4096": [19, 28], "40ghz": 31, "41": [16, 28], "41249612335034": 57, "413": 29, "416651": 62, "419072": 62, "42": 31, "42261": 53, "425": 29, "43": [16, 29, 31, 42], "435": 31, "438": 29, "44": [11, 16, 29], "4498": 28, "452": 29, "45x": 31, "461180928": 51, "465": 29, "47": [16, 29, 61], "4718971": 53, "479": 62, "479142": 53, "47eb": [37, 42], "48": [16, 29, 51, 61], "480": 29, "4800": 31, "481086": 53, "4818356": 53, "49": [29, 61], "4929404": 53, "494": 29, "4d": 25, "4th": [31, 41, 47], "5": [11, 18, 19, 20, 22, 25, 28, 30, 33, 35, 39, 40, 41, 51, 53, 57, 62], "50": [29, 31, 35], "5000": 31, "5063303": 53, "509": 29, "50ghz": 32, "51": [16, 29, 31, 51], "510076": 14, "51179520": 51, "512": [31, 51, 57], "5120": 62, "512x512": 31, "517385": 53, "52": [16, 28, 29, 51], "523": 31, "5294489860534668": 28, "53": [29, 31], "5300783": 53, "5333": 37, "54": 58, "5479512": 53, "549": 29, "55": [14, 16, 29, 31, 32, 35, 62], "550": 29, "555174": 61, "555221": 61, "5597944": 53, "56": [16, 29, 31, 32, 35], "57": 31, "5774": 51, "57x": 31, "58": 29, "586": 29, "59": [16, 29], "590331": 61, "594147": 62, "595": 51, "596": [37, 42, 51], "597": 51, "597360": 62, "598": 51, "5e": 51, "5th": 31, "6": [18, 26, 28, 30, 31, 33, 42, 49, 51], "60": [28, 29, 31, 35, 51], "600": [51, 61], "60000": [19, 28], "600w": 31, "601": 51, "602": 51, "6027272": 53, "602742": 61, "603262": 61, "604": [29, 51], "6047": 31, "605": 29, "606": 51, "607": 51, "6153628825864496": 47, "6240": 28, "63": [16, 29], "6336y": 31, "6342418": 53, "634554": 62, "64": [14, 16, 17, 19, 28, 29, 31, 35, 37, 39, 41, 42, 51, 56], "640x640": 49, "6416": 51, "6422923": 53, "6456823": 53, "6461415": 53, "6514435": 53, "65504": 28, "6628485": 53, "66fa74b6a2a0bb1e563ae8bce66496b118b95200": 54, "67": [16, 29, 31], "6761076": 53, "68": 29, "6867": 31, "69": 31, "692": 31, "6926193": 53, "693": 29, "694": 29, "69612": 49, "699": 31, "7": [18, 28, 29, 30, 31, 33, 49, 51, 54], "7090344": 53, "71": 29, "7112d33": 33, "718459": 53, "72": [29, 49], "7239000201225281": 28, "7296917": 53, "7297122": 53, "730m": 14, "736": 31, "74": 31, "7494": 28, "75": [29, 31], "7520": 28, "757": 29, "76": [25, 29, 31, 51], "768": 51, "768_a": 51, "772": 29, "773": 11, "7787259": 53, "784": [19, 28, 29, 35], "79": 29, "790128": 61, "790632": 62, "792936": 62, "795": 29, "7987": 28, "7f": 51, "8": [18, 25, 28, 29, 31, 33, 40, 41, 42, 49, 51, 52], "80": [29, 31], "800": 61, "803": [37, 42], "806": 29, "81": [31, 51, 54, 57], "810": 51, "817": 29, "8180m": 32, "8192": [19, 28], "81m": 28, "82574l": 31, "828": 29, "83": [29, 31, 32, 51], "839": 29, "83m": 28, "84": [29, 31, 32], "841192": 25, "8413447": 25, "8480": [31, 35], "84m": 28, "85": 35, "850": 29, "8500": [3, 34], "8501": 34, "8534": 28, "85485": 53, "8598063": 53, "85m": 28, "86": [16, 31], "8672705": 53, "867908472383153": 47, "87": [29, 31], "870": 31, "875052": 53, "8751": 28, "88": [29, 57], "8809638": 53, "8819": 28, "8863": 28, "8876": [37, 42], "888000e": 51, "8880196": 53, "8888": [41, 42, 47, 52, 54, 56], "88eb3cff2f03dad85035621d041e23a14345999": 55, "891": 29, "892": 29, "8941312": 53, "8972": 28, "89942324": 53, "8x16gb": 31, "9": [14, 18, 25, 26, 29, 30, 37, 38, 39, 41, 42, 45, 46, 56, 62], "9000": 5, "908": 29, "909": 29, "91": [29, 31], "911": 29, "9154005": 53, "9168000221252441": 28, "917546": 61, "917738": 61, "918": 31, "92": [29, 31], "924008369445801": 28, "9259825": 53, "9260886": 53, "9266936945121049176": 2, "928": 31, "92880015134813": 47, "92x": 31, "93": 31, "930": 29, "9349675": 53, "9373732": 53, "9377": 28, "9381000399589539": 28, "9381838": 53, "93901324": 53, "94": 16, "940695": 58, "9410": 28, "947": 29, "948": 29, "9486000537872314": 28, "949225": 53, "95": [29, 31], "951": 29, "9536000490188599": 28, "96": [29, 31, 40, 51], "9631021": 53, "9677248": 53, "968": 31, "96x": 31, "97": 16, "9702091": 53, "9746864": 53, "9755": 28, "98": 16, "9842": 31, "9873173": 53, "988714": 53, "99": 16, "9959502": 25, "9963627": 25, "999": [25, 26], "99998": 25, "A": [0, 5, 17, 18, 24, 28, 29, 32, 33, 34, 36, 42, 44, 47, 58], "And": [30, 37, 41, 42, 51], "As": [17, 24, 28, 29, 32], "At": [16, 17, 21, 45, 54], "Being": 0, "But": [27, 28], "By": [13, 20, 28, 29, 32, 52], "For": [0, 1, 2, 4, 7, 11, 14, 15, 18, 19, 20, 23, 25, 26, 28, 29, 31, 33, 34, 35, 37, 42, 47, 48, 49, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62], "If": [2, 3, 5, 20, 22, 25, 26, 27, 28, 29, 32, 33, 35, 37, 39, 40, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60], "In": [4, 11, 16, 18, 19, 27, 28, 29, 30, 32, 35, 36, 38, 45, 47, 49, 52, 53, 58, 62], "It": [4, 11, 14, 15, 16, 17, 18, 19, 20, 21, 28, 30, 32, 35, 36, 38, 39, 44, 51, 52, 55, 56, 60, 63], "NOT": [7, 14], "No": [0, 14, 19, 22, 35, 39, 47, 48, 51, 54, 55, 56, 57, 60], "Not": 20, "ON": [17, 31, 33, 47, 62], "Of": 51, "On": [28, 32, 37, 41, 42], "One": [29, 32], "That": [14, 32, 39, 40, 47], "The": [0, 2, 4, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 45, 47, 49, 51, 52, 55, 56, 57, 58, 60, 61, 62], "Their": 28, "Then": [3, 11, 22, 33, 41, 42, 52], "There": [21, 27, 36, 39, 45, 47, 52, 61], "These": [16, 24, 28, 29, 63], "To": [2, 3, 4, 7, 16, 18, 19, 24, 27, 28, 32, 36, 37, 39, 40, 41, 42, 45, 51, 52, 54, 55, 60], "With": [18, 19, 28, 29, 30, 45, 48, 53, 54], "_": [0, 11, 13, 14, 17, 18, 20, 22, 24, 27, 28, 29, 30, 32, 33, 34, 35, 37, 39, 40, 46, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61], "__del__": 56, "__init__": 35, "__main__": [29, 35], "__name__": 35, "__version__": [11, 33, 37, 39, 40, 41, 42, 63], "_gbs1_": 51, "_gbs2_": 51, "_pywrap_itex": 39, "_timestamp_inst": 29, "_timestamp_instance_n_cor": 29, "a100": 54, "a380": [39, 40], "a730m": [39, 40], "a930253": 33, "abl": 5, "about": [0, 7, 19, 32, 34, 35, 45, 51, 52, 58], "abov": [18, 19, 22, 28, 29, 32, 37, 47, 51, 52, 55, 56, 57, 58, 60, 62], "absolut": [29, 51], "abus": 0, "acceler": [4, 14, 16, 30, 31, 33, 44, 47, 52, 63], "accept": [0, 7, 17], "access": 37, "accmatmul": 24, "accord": [17, 18, 47, 56, 58, 61], "accordingli": 62, "account": 0, "accumul": 31, "accur": 36, "accuraci": [15, 18, 19, 25, 28, 44, 45, 52, 58, 61], "achiev": [18, 32], "acm": [39, 40], "across": [16, 20, 25], "act": [0, 21, 34], "action": [0, 5, 36], "activ": [11, 18, 19, 22, 25, 28, 32, 33, 37, 38, 39, 40, 41, 42, 46, 47, 48, 52, 53, 55, 56, 58, 60], "ad": [5, 13, 17, 18, 21, 23, 28, 39, 51, 62], "adam": 25, "adamw": 25, "adamwithweightdecayoptim": 26, "adapt": 0, "add": [3, 4, 5, 17, 18, 19, 24, 27, 32, 34, 37, 39, 40, 47, 54, 62], "add_weight": 35, "add_with_xla": 30, "addit": [8, 21, 23, 24, 32, 36, 40, 63], "addition": [18, 28], "addn": 24, "addon": [26, 58], "address": [0, 32, 37], "adher": 63, "adjust": [20, 25, 51], "adjusted_init_lr": 51, "adopt": [4, 15, 16, 21], "advanc": [0, 4, 20, 30, 33, 44, 63], "affect": [0, 18, 28], "affin": 32, "after": [2, 17, 18, 19, 22, 24, 26, 27, 28, 32, 33, 36, 37, 38, 42, 45, 51, 56], "afterward": [28, 29, 32], "ag": 0, "again": 28, "against": 7, "agent": 37, "aggress": [0, 16, 18, 19], "ahead": [39, 40], "ai": [44, 45, 50, 52, 63], "aim": 63, "aka": 21, "akdlm": [37, 42], "al": 25, "alexnet": 44, "alg": 11, "alg_kind_": 11, "algebra": [4, 16, 30], "algo": 11, "algorithm": [11, 25], "align": [0, 13], "all": [0, 7, 11, 14, 18, 20, 21, 25, 27, 28, 30, 32, 37, 42, 45, 47, 51, 62], "allocate_output": 11, "allow": [0, 16, 18, 28, 32, 35, 56, 63], "allowlist": 18, "allowlist_add": [18, 19], "allowlist_remov": 18, "almost": 21, "along": [30, 32], "alpha": 11, "alpha_": 11, "alreadi": [18, 28, 38, 45], "also": [0, 4, 7, 15, 16, 17, 19, 21, 23, 27, 28, 29, 30, 32, 36, 37, 38, 41, 42, 63], "altern": 18, "although": 32, "alwai": [18, 28, 36], "alwayslink": [11, 34], "am": 51, "amd64": [7, 37], "among": [29, 32], "amount": [14, 28], "amp": [4, 18, 29, 31, 44, 55, 60, 63], "ampthre": 18, "amx": 52, "amx_bf16": 52, "amx_int8": 52, "an": [0, 2, 3, 4, 7, 11, 13, 14, 16, 18, 19, 21, 24, 25, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 40, 42, 44, 49, 52, 53, 57, 62, 63], "anaconda": 38, "analysi": [16, 32], "analyt": 45, "analyz": [16, 22], "ani": [0, 4, 11, 16, 20, 21, 23, 24, 27, 28, 29, 37, 38, 39, 42, 45, 53, 56], "annot": 17, "anoth": [29, 32, 36], "answer": 0, "antirectifi": 35, "aot": [39, 40], "apach": 63, "api": [4, 7, 9, 10, 14, 15, 16, 19, 25, 26, 27, 28, 30, 32, 34, 40, 52, 53], "apolog": 0, "apologi": 0, "appear": [0, 28], "append": [35, 37, 41, 42], "appli": [0, 16, 17, 25, 28, 33, 34, 51, 54, 55, 57, 60, 62], "applic": [4, 21, 23, 31, 32, 33, 34, 36, 45], "apply_gradi": 28, "appoint": 0, "approach": [4, 16, 38], "appropri": [0, 3, 32, 39, 40], "approv": 7, "approxim": [11, 25], "approximate_": 11, "apt": [7, 34, 37, 39, 42], "ar": [0, 2, 4, 5, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 36, 37, 39, 40, 41, 42, 44, 45, 47, 51, 52, 53, 55, 58, 61, 63], "arang": 25, "arc": [14, 39, 40, 42, 47, 63], "arch": 37, "architectur": [11, 16], "archiv": 37, "area": 13, "arg": [2, 13, 33], "argument": [13, 25, 28, 29, 33], "around": [0, 29, 51], "arrai": 25, "articl": 32, "as_graph_el": 35, "ask": [4, 36, 39, 40], "aspect": 28, "assign": [29, 32, 40], "assign_i": 40, "assign_x": 40, "assist": 8, "assum": [17, 28, 32, 38, 39, 40, 51, 55, 60], "assumpt": [2, 3], "astyp": [19, 28, 35, 53], "ats": [39, 40], "atsp": 28, "attach": [2, 3, 28, 32], "attack": 0, "attent": [0, 20], "attr": [11, 20], "attribut": [24, 33], "auto": [4, 11, 17, 27, 29, 30, 33, 40], "auto_mixed_precis": [18, 19, 33, 47], "auto_mixed_precision_log_path": [20, 33], "auto_mixed_precision_opt": [18, 19, 47], "auto_mixed_precision_optionsgraph_opt": 18, "auto_mod": [17, 62], "auto_sharding_pass": 17, "auto_sharding_pass_mlir": 17, "autom": [21, 29], "automat": [4, 5, 16, 17, 18, 19, 21, 26, 28, 29, 31, 32, 33, 37, 42, 44, 48, 53, 62], "automixedprecis": 18, "automixedprecisionopt": [18, 19, 47], "automixedprecosionopt": 18, "autoshard": [17, 62], "ava": 49, "avail": [0, 2, 3, 11, 14, 19, 25, 29, 32, 35, 36, 39, 40, 41, 42, 55], "averag": 51, "avgpool": [18, 19, 49], "avgpool3d": [18, 19], "avoid": [0, 4, 24, 27, 28, 29, 32, 35, 38, 51], "avx512": [4, 21, 52], "avx_vnni": 52, "awk": 51, "axi": [25, 26, 35], "b": [30, 35, 40, 47, 49, 51, 52, 61, 62], "b4ab4b8f8b3a41fade4899fd00b5b2d2dad0981f3e1bb10df4c522975fd7": 40, "b7a8": [37, 42], "ba": 25, "back": [17, 28, 39], "backend": [4, 16, 21, 23, 26, 27, 28, 33, 42, 47, 48, 52, 53, 63], "background": 32, "background_thread": 29, "backward": [11, 28], "balanc": [18, 19, 31, 35], "bare": 44, "base": [7, 11, 14, 15, 16, 18, 19, 25, 31, 32, 37, 38, 41, 44, 47, 51, 52, 57, 58, 62, 63], "base_config": 35, "base_shap": 35, "basekit": [37, 38, 42], "bash": [2, 37, 38, 39, 40, 47, 51, 52, 60, 63], "bashrc": 38, "basi": 37, "basic": [18, 19, 20, 28], "batch": [17, 25, 28, 29, 31, 51, 62], "batch_siz": [16, 17, 19, 28, 35, 55, 62], "batch_size_per_gpu": 51, "batchmatmul": [24, 26], "bazel": [3, 11, 34], "bazelbuild": [7, 39, 40], "bazelrc": 39, "becaus": [18, 19, 28, 36], "becom": [13, 32, 36], "been": [28, 32, 54, 62], "befor": [5, 7, 11, 16, 18, 19, 24, 27, 28, 29, 32, 35, 36, 39, 40, 44, 62], "begin": [7, 11, 47], "behavior": [0, 27, 28, 29, 32, 36, 51], "being": 32, "below": [2, 3, 24, 25, 28, 29, 30, 31, 32, 33, 37, 39, 42, 51, 56], "benchmark": [7, 16, 31, 35, 55, 61], "benefit": [4, 21, 28, 32, 33], "bert": [16, 20, 25, 36, 44], "bert_base_dir": 16, "bert_base_model": 16, "bert_config": [16, 57], "bert_config_fil": [16, 57], "bert_larg": 16, "bert_large_dir": 57, "bert_model": [51, 57], "bert_prep_working_dir": 51, "besid": [21, 32], "best": [0, 14, 16, 27, 37], "beta": 11, "beta_": 11, "beta_1": [25, 26], "beta_2": [25, 26], "beta_constraint": [25, 26], "beta_initi": [25, 26], "beta_regular": [25, 26], "better": [4, 15, 16, 18, 19, 21, 24, 25, 27, 29, 32, 35, 36, 44, 51, 52, 54, 55, 60], "between": [16, 17, 18, 19, 21, 32, 34, 35, 39, 54, 61, 62], "bf16": [18, 19, 24, 31, 44, 45, 47, 51, 55, 60, 61, 62], "bf32": 20, "bfloat16": [4, 11, 18, 19, 21, 24, 28, 33, 47, 51, 55, 57, 60], "bfloat16graph_opt": 19, "bia": [13, 20, 24, 53], "bias_add": 53, "bias_initi": [25, 26], "biasadd": [20, 26], "biasaddgrad": 24, "big": 45, "bin": [3, 7, 11, 29, 34, 39, 40, 46, 47, 48, 52, 55, 56, 58, 60], "bin_threadpool": 3, "binari": [18, 34, 39, 40], "bind": [13, 30, 32, 40], "bind_al": 22, "bit": [15, 18, 28, 33, 37, 39, 41, 42, 47], "blob": [21, 34], "block": [11, 32, 33, 35, 36, 42], "blocker": 45, "blocktim": 32, "blog": 16, "board": 31, "bodi": 0, "bookcorpu": [31, 51], "bool": 11, "boolean": [24, 29], "boost": [4, 21, 29, 31, 32], "both": [4, 7, 14, 15, 18, 19, 23, 27, 29, 30, 31, 32, 33, 39, 47, 61], "bound": 32, "box": 15, "brain": 55, "branch": [5, 7, 39], "break": 24, "bridg": [21, 34], "briefli": 32, "bring": [23, 28, 29, 63], "browser": [5, 22, 41, 42, 49, 52, 54, 56], "bs1": 49, "bt": 35, "bu": [2, 30], "buffer": [16, 49], "bug": [7, 63], "buid": 40, "build": [4, 7, 9, 35, 43, 44, 45, 51, 63], "build_doc": 5, "build_pip_packag": [11, 39], "build_tmp": 5, "build_with_threadpool": 40, "builder": 61, "buildifi": 7, "buildtool": 7, "built": [11, 16, 34, 41, 42], "bus_id": 2, "busi": 32, "bzl": 7, "c": [2, 4, 10, 11, 14, 29, 30, 32, 35, 37, 38, 39, 41, 42, 43, 56, 63], "c481324031ecf0f70f8939516c02e16cac60446d": 60, "c_api_experiment": 40, "c_str": 40, "cach": [12, 15, 32, 35, 51], "calcul": [29, 54], "calibr": 52, "call": [11, 15, 16, 26, 28, 30, 32, 33, 35, 36, 43, 46, 52, 53, 56, 57], "callabl": 56, "can": [2, 3, 4, 7, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 45, 51, 55, 56, 60, 61, 62, 63], "cannot": [14, 18, 27, 35, 47, 48, 51, 54, 55, 57, 60], "capabl": [4, 14, 27, 28], "capi": 30, "card": [20, 51, 58], "case": [4, 13, 18, 19, 21, 28, 29, 32, 35, 47], "cast": [0, 18, 24, 28, 49], "cat": 29, "catch": 11, "caus": [27, 28, 32, 35, 56], "cbica": 55, "cc": [3, 11, 14, 17, 28, 30, 34, 42, 58, 62], "ccl": [38, 42], "cd": [2, 5, 7, 16, 32, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 62], "cell": [28, 54], "center": [1, 4, 16, 21, 25, 26, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "cento": 41, "certain": [16, 29, 32], "challeng": 55, "chanc": [18, 28], "chang": [4, 5, 7, 11, 18, 19, 20, 21, 23, 27, 28, 29, 30, 36, 38, 44, 45, 56, 58], "channel": [0, 24, 25, 43], "channels_last": 62, "characterist": 0, "cheap": 35, "check": [5, 7, 11, 13, 14, 18, 19, 21, 23, 28, 29, 37, 38, 39, 40, 45, 46, 47, 57, 63], "checker": 32, "checkout": [5, 34, 40, 55, 60, 62], "checkpoint": 51, "choos": [16, 23, 25, 27, 28, 29, 32, 35, 39, 40, 43, 47, 49, 52, 53, 55], "chrome": 5, "circular": 27, "ckpt": [51, 57], "clang": 7, "clarifi": 0, "clariti": 0, "class": [0, 11, 28, 33, 35], "classic": 32, "classif": 22, "classifi": [44, 61], "classifier_train": 61, "classify_text_with_bert": 56, "claus": [4, 21, 23], "clean": [11, 40], "clearlist": 18, "clearlist_add": 18, "clearlist_remov": 18, "click": [11, 39, 40], "client": [2, 30, 40], "client_sess": 40, "clientsess": 40, "clock": 14, "clone": [5, 16, 34, 39, 40, 51, 54, 55, 57, 60, 61, 62], "close": [25, 27, 32], "closer": 24, "cluster": [27, 38], "cm": 37, "cmake": 39, "cnn": [18, 31, 32, 44, 45], "co": [4, 14, 15, 21], "coco": [31, 49, 60], "coco17": 49, "code": [2, 4, 5, 9, 11, 16, 20, 21, 22, 23, 27, 30, 31, 32, 34, 35, 43, 44, 45, 47, 49, 52], "codebas": [4, 30], "codenam": 4, "colab": 28, "collabor": [16, 63], "collect": [2, 32, 42], "color": 0, "com": [0, 5, 7, 8, 16, 21, 28, 32, 34, 35, 37, 38, 39, 40, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "combin": [16, 21, 29, 32, 54], "come": 4, "comma": 32, "command": [2, 3, 14, 22, 29, 32, 37, 38, 39, 40, 41, 42, 46, 47, 49, 52, 57], "comment": [0, 7, 14], "commit": [0, 5, 17, 34], "common": [0, 11, 14, 17, 21, 32, 44, 51], "common_runtim": [11, 30], "commonli": 32, "commun": [0, 2, 7, 9, 21, 23, 32, 42, 63], "compact": [29, 32, 35], "compar": [16, 18, 28, 32, 44], "compat": [2, 3, 4, 15, 19, 21, 23, 26, 28, 30, 33, 35, 51, 52, 54, 55, 56, 57, 60, 61], "compet": 32, "competit": 32, "compil": [4, 11, 14, 16, 19, 21, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 40, 42], "compiler_vers": 33, "complaint": 0, "complet": 32, "complic": [21, 29], "compon": [17, 19, 31, 33, 37, 38, 39, 40, 42], "compos": 17, "compressor": [4, 15, 21, 44, 45, 52], "comput": [4, 11, 15, 16, 25, 28, 32, 35, 37, 45, 53, 54, 63], "compute_dtyp": 28, "compute_gradi": 28, "concat": 35, "concaten": [35, 54], "concatv2": 49, "concept": [16, 28, 32], "concrete_funct": 35, "concurr": [4, 13, 20, 32, 35], "conda": [4, 14, 43, 51, 56], "conda_prefix": 29, "conduct": [7, 29], "conduit": [4, 30], "conf": 29, "config": [11, 14, 17, 18, 19, 28, 34, 35, 37, 39, 40, 42, 47, 52, 58, 61, 62], "config_fil": 61, "configproto": [17, 18, 19, 47, 52, 62], "configur": [4, 8, 11, 14, 17, 19, 21, 23, 28, 29, 33, 35, 37, 42, 49, 61, 63], "confirm": [29, 39, 40], "conflict": 35, "conform": 7, "connect": 32, "consecut": 32, "consequ": 0, "consid": [0, 18, 58], "consist": [7, 28], "consol": 42, "const": 40, "constant": [11, 15, 16, 25, 26, 28, 30], "constant_fold": 52, "constraint": 25, "construct": [0, 11, 17, 28], "constructor": 28, "consum": 51, "consumpt": [19, 21, 28, 47], "contact": 8, "contain": [5, 9, 15, 17, 27, 29, 32, 34, 43, 44, 55, 60, 63], "content": [5, 40, 42], "context": [11, 25, 32], "contigu": 32, "continu": [0, 14, 18, 27, 28], "contrast": 16, "contribut": [0, 4, 14, 21, 29, 39], "contributor": [7, 63], "control": [31, 32, 44, 52, 62], "conv": [17, 24, 53], "conv2d": [4, 21, 49, 53], "conv3d": 24, "convent": 7, "convers": [17, 18, 19, 24], "convert": [15, 16, 17, 18, 19, 28, 36, 45, 47, 49, 55, 61], "convert_to_tensor": 11, "convgradfilt": 24, "convolut": 32, "cooper": [4, 21, 44, 49, 52], "copi": [2, 3, 40], "copt": [11, 34], "copyright": 7, "core": [9, 11, 14, 17, 26, 28, 30, 31, 32, 35, 39, 40, 42, 52, 53, 58, 62], "core_id": 29, "core_list": 29, "correct": [28, 35, 39, 40], "correspond": [18, 29, 30, 36], "correspondli": 61, "cost": 15, "costli": 32, "could": [0, 18, 28, 33, 40, 45, 51, 52], "count": 14, "coupl": 32, "coven": [7, 63], "cover": [19, 21, 24, 29, 32], "cp": [3, 40, 51], "cp311": 40, "cpp": [3, 14, 17, 37], "cpplint": 7, "cpu": [2, 3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 28, 31, 33, 34, 36, 43, 44, 45, 49], "cpudevic": 11, "cpunodebind": 32, "crash": 56, "creat": [11, 18, 28, 29, 30, 33, 36, 38, 42, 46, 49, 52, 55, 60, 62], "create_datasets_from_start": 51, "creatednnlengin": 11, "creatednnlstream": 11, "creation": 13, "critic": 18, "cross": [29, 32], "ctl": 61, "ctx": 11, "cuda": 28, "cuda_diagnost": 28, "cuda_driv": 28, "cuinit": 28, "curl": 38, "current": [14, 17, 22, 33, 51, 55, 60, 62], "custom": [4, 7, 9, 16, 18, 21, 26, 27, 29, 33, 37, 42, 51], "custom_graph_optimizer_registri": 58, "cv": 54, "cvfh": 3, "d": [7, 35, 37, 39, 40, 61], "d50dnp1sbb": 31, "dai": 51, "danger": 18, "dashboard": 22, "data": [4, 15, 16, 17, 18, 21, 22, 25, 28, 33, 35, 39, 40, 42, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "data_dir": [16, 51, 55, 60, 61], "data_f32": 11, "data_format": [20, 62], "data_typ": [18, 19, 47], "dataset": [19, 28, 31, 35, 52, 58], "dataset_dir": [55, 60], "datatyp": [33, 40, 51, 55, 60], "dch": 37, "dcmake_build_typ": 39, "ddr4": 31, "ddr5": 31, "de6201297144": [37, 42], "dealloc": 32, "dearmor": 37, "deb": [37, 39], "debug": [11, 20, 22, 33], "debugalloc": 32, "decai": 25, "decayed_learning_rate_at_crossover_point": 51, "decid": 17, "decis": [0, 17], "declar": 11, "decoupl": [25, 30], "dedic": 7, "deem": 0, "deep": [15, 25, 27, 32, 36, 44, 63], "deeper": 23, "deeplearningexampl": [31, 51, 55, 60], "def": [28, 30, 35], "default": [4, 7, 13, 14, 15, 18, 19, 20, 21, 23, 27, 28, 30, 31, 32, 33, 35, 39, 40, 51, 52, 53, 60, 61, 62], "default_data_typ": [18, 33], "default_dataset": 49, "default_static_qconfig": 49, "defin": [4, 16, 28, 40], "definit": [7, 18, 23, 33], "deleg": 15, "deliv": [4, 19, 21, 27], "delta_tim": 35, "demand": [13, 63], "demo": 22, "demonstr": [0, 31, 44], "denali": 31, "deni": 18, "dens": [19, 20, 28, 35], "dense1": 28, "dense2": 28, "dense_1": [19, 28], "dense_2": [19, 28], "dense_logit": [19, 28], "denylist": 18, "denylist_add": 18, "denylist_remov": 18, "dep": [11, 34], "depend": [14, 16, 19, 29, 32, 36, 37, 39, 40, 42], "deploi": [21, 34], "deploy": [38, 41, 42], "deprec": 39, "depthwiseconv2dn": 49, "dequant": [49, 52], "derogatori": 0, "desc": [11, 13], "descibl": 11, "describ": [25, 28, 29, 32], "descript": [9, 13, 18, 29, 32, 33, 44, 56], "descriptor": 11, "design": [4, 7, 9, 21, 30, 34, 45], "desir": [18, 29], "destruct": 32, "detail": [2, 3, 11, 15, 16, 17, 18, 19, 21, 23, 25, 28, 32, 33, 36, 37, 39, 40, 42, 45, 47, 51, 63], "detect": [32, 49], "determin": [0, 11, 28, 32], "dev": [2, 3, 14, 22, 34, 39, 42, 47, 57], "develop": [4, 14, 16, 21, 30, 32, 37, 39, 40, 41, 42, 63], "deviat": 25, "devic": [2, 3, 4, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 28, 33, 34, 39, 40, 42, 47, 62, 63], "device_cpu": 11, "device_gpu": [11, 17, 62], "device_lib": 2, "device_num": [17, 62], "device_typ": [2, 14, 17, 39, 40, 58, 62], "diagram": 63, "dialect": [16, 17], "dict": 35, "did": [28, 32], "diff_undef": 11, "diffent": 27, "differ": [0, 2, 4, 13, 16, 20, 21, 23, 25, 29, 30, 32, 33, 35, 36, 43], "differenct": [39, 40], "differenti": 39, "difficult": 30, "diffus": [44, 63], "digit": [19, 28], "dim": 13, "dimens": 17, "dir": [2, 3, 7, 51, 55, 56, 57, 60], "directli": [11, 14, 17, 27, 28, 29, 32, 36, 42], "directori": [2, 3, 4, 5, 7, 14, 17, 29, 34, 37, 39, 40, 42, 47, 48, 49, 51, 54, 55, 57, 60], "diretcori": 40, "disabl": [0, 15, 19, 27, 29, 30, 32, 33], "disable_numactl": 29, "disable_taskset": 29, "disbal": 39, "discontinu": 14, "discuss": 7, "disk": [36, 49], "disparag": 0, "displai": [20, 49], "distanc": 54, "distinguish": [28, 30], "distribut": [2, 4, 8, 31, 32, 37, 38, 42, 43, 44, 51, 60, 61, 63], "distribution_strategi": 62, "divers": 0, "divid": [25, 28, 32], "divis": 28, "dl": 7, "dll": 51, "dllogger": [55, 60], "dllvm_enable_project": 39, "dnnl": [11, 13], "dnnl_arg_dst": 11, "dnnl_arg_scratchpad": 11, "dnnl_arg_src": 11, "do": [7, 14, 19, 27, 28, 29, 33, 36, 39, 52], "do_benchmark": 35, "do_lower_cas": 16, "do_predict": [16, 57], "do_train": [16, 57], "doc": [5, 9, 11, 39, 56], "doc_strid": 57, "docker": [9, 43, 44], "dockerfil": 2, "dockerhub": 63, "docs_build": 9, "docstr": 11, "document": [2, 3, 28, 31, 36, 38, 39, 40], "doe": [16, 24, 27, 28], "doesn": [5, 17, 18, 36, 56], "domin": 28, "don": [28, 49], "done": [7, 22, 28, 32, 35, 37], "doubl": 28, "download": [2, 8, 28, 32, 37, 42, 49, 51, 60, 61], "download_and_preprocess_coco": 60, "downstream": 18, "dpc": [21, 37, 38, 39, 40, 42], "dpcpp": [33, 37], "draft": 5, "dramat": 32, "dri": [2, 3, 34, 42, 47], "drive": 35, "driver": [2, 3, 14, 28, 31, 38, 45, 47, 52, 63], "drop": [18, 29, 35], "dropout": 35, "dst_mem": 11, "dst_tensor": 11, "dt_float": [20, 40], "dtype": [11, 19, 25, 26, 30, 35, 53, 62], "dtype_polici": 28, "due": [18, 27, 32, 35], "dummi": [31, 49, 61], "dummy_v2": 49, "dump": [20, 35], "duplic": 39, "dure": [0, 15, 16, 18, 19, 24, 28, 36, 38, 39, 40, 47], "dut3046": 28, "dynam": [13, 28, 32, 35, 36], "e": [0, 2, 3, 5, 11, 17, 28, 29, 34, 40, 60, 61], "each": [14, 25, 28, 29, 30, 31, 32, 62], "eager": [11, 25], "earli": 37, "easi": [16, 21, 30, 45], "easiest": 38, "easili": [16, 30, 31, 33], "ecc": 31, "echo": [37, 51], "econom": 0, "ecosystem": [16, 30, 63], "ed": 40, "edit": [0, 2], "edu": 55, "educ": 0, "effect": [18, 29, 32], "effici": [4, 16, 21, 30, 32, 34, 35, 51, 62, 63], "effort": 37, "egg": 60, "eigen": [4, 20], "either": [3, 19, 27, 49], "elaps": [32, 49], "elig": 11, "elimin": [16, 36], "els": [19, 28, 40, 61], "eltwis": 11, "eltwise_bas": 11, "eltwise_base_hdr": 11, "eltwise_forward": 11, "eltwise_gelu_erf": 11, "eltwise_gelu_tanh": 11, "eltwise_relu": 11, "eltwisebaseop": 11, "elu": 24, "email": 0, "emit": 16, "empathi": 0, "empir": 25, "en": 42, "enabl": [4, 13, 15, 16, 17, 18, 21, 22, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 40], "enable_checkpoint_and_export": 62, "enable_itex_amp": 29, "enable_itex_layout_opt": 29, "enable_jemalloc": 29, "enable_op_parallel": 29, "enable_tcmalloc": 29, "enable_tensorboard": 62, "enable_tf_profil": [4, 21, 22, 28], "enable_xla": 62, "encod": 20, "encompass": 16, "encount": 14, "end": [28, 35, 39, 40, 44, 45, 52], "engin": [11, 14], "enhanc": [4, 30], "ensur": [7, 29], "enter": [2, 3, 22, 38, 39, 40], "enterpris": [31, 42], "entir": 28, "entri": 17, "enum": 33, "env": [14, 34, 38, 39, 40, 42, 46, 51, 52, 54], "env_check": [37, 38, 42, 63], "env_itex": [46, 47, 52, 54, 55, 56, 58, 60], "env_itex_cpu": [48, 56], "env_nam": 46, "environ": [0, 2, 4, 11, 13, 15, 16, 19, 21, 22, 23, 27, 28, 30, 32, 34, 35, 43, 44, 63], "environment": [30, 40], "epoch": [18, 19, 28, 35, 51, 58, 60], "epoch_loss_avg": 28, "epsilon": [25, 26], "equal": [24, 27, 32], "equival": [4, 28], "error": [4, 7, 11, 14, 20, 25, 28, 34, 47, 48, 51, 54, 55, 56, 57, 60], "errors_impl": [14, 47, 48, 51, 54, 55, 57, 60], "especi": [13, 38], "estim": [36, 63], "et": 25, "etc": [21, 30, 37, 39], "ethernet": 31, "ethnic": 0, "eu": 14, "eval_batch_s": 51, "evalu": [19, 28, 35, 54, 57], "even": [28, 29, 32, 43, 51, 63], "event": 0, "everi": [18, 20, 54], "everyon": 0, "evo": 31, "evolv": 30, "exact": 31, "exact_match": [51, 57], "exactli": 30, "exampl": [0, 2, 4, 5, 7, 9, 11, 14, 15, 20, 21, 24, 25, 26, 28, 31, 32, 33, 34, 37, 38, 45, 47, 50, 52, 56, 63], "example_test": 40, "except": [30, 33, 42, 51], "excess": 30, "exclud": 7, "exclus": 29, "excutor": 27, "exec": [11, 13], "exec_mod": 55, "execut": [2, 5, 11, 13, 15, 16, 17, 18, 19, 20, 22, 25, 28, 31, 32, 36, 39, 44, 52, 53], "executor": 15, "exist": [19, 24, 26, 28, 29, 45], "exit": 34, "exp": 18, "expect": [18, 38, 52, 63], "experi": [0, 4, 21, 23, 32], "experiment": [4, 13, 14, 22, 33, 39, 40, 42], "experimental_compil": 30, "experimental_gelu": 16, "experimental_ops_overrid": [26, 33], "explain": 18, "explan": 0, "explicit": [0, 11, 28, 32], "explicitli": [28, 29, 33, 52], "export": [4, 7, 11, 15, 16, 17, 18, 19, 21, 22, 28, 29, 30, 32, 34, 37, 38, 40, 42, 46, 47, 51, 52, 54, 57, 61, 62, 63], "expos": [21, 22, 63], "expr": 51, "express": 0, "extend": [4, 14, 21, 23, 25, 30, 32, 33], "extens": [5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "extent": 31, "extern": [0, 14, 40], "extra": [18, 28, 36], "extract": 51, "f": [2, 35, 40, 63], "f0": 11, "f1": [51, 57], "f502f0715979ec73c571ca5676ba58431b916f5f58ee3333": 56, "facilit": [4, 30], "factor": [21, 29], "fail": [11, 28, 33, 36], "fair": 0, "fairli": 0, "fallback": 25, "fals": [7, 16, 17, 25, 27, 28, 29, 35, 51, 57, 62], "familiar": 11, "faq": 0, "far": 28, "fashion": [4, 21], "fast": 25, "faster": [18, 19, 25, 27, 28, 32, 35, 36, 47, 49], "fatal": 14, "fdc7a2bc": [37, 42], "featur": [4, 7, 8, 11, 13, 17, 25, 32, 36, 39, 44, 52, 62, 63], "feedback": [0, 7], "fetch": 40, "few": [28, 61], "fewer": 28, "fi": 61, "fi_provid": 38, "fid": 54, "field": [33, 39, 40], "fig": [16, 36], "figur": [16, 30, 32], "file": [2, 5, 7, 14, 17, 18, 22, 29, 34, 37, 42, 47, 48, 49, 51, 54, 55, 56, 57, 60, 61, 63], "filenam": 35, "fill": [39, 40], "filter": 7, "filter_height": 53, "filter_width": 53, "final": [17, 19, 28, 51], "final_carry_st": 25, "final_memory_st": 25, "find": [7, 11, 22, 31, 32, 34, 36], "fine": [28, 29, 31, 32, 35, 51], "finish": [28, 35, 39, 53, 56], "first": [17, 18, 19, 22, 24, 25, 27, 28, 29, 30, 32, 37, 38, 39, 41, 42, 51, 55, 60], "fit": [19, 32, 35], "fix": [7, 28, 37], "flag": [17, 30, 40, 60], "flex": [39, 40, 42, 45, 47, 50, 52, 54, 57, 63], "flexibl": [4, 30, 33, 35], "flexibli": 63, "float": [11, 18, 20, 28, 33, 40, 47], "float16": [4, 16, 18, 19, 21, 28, 33, 47], "float16graph_opt": [18, 19], "float32": [11, 19, 24, 25, 26, 28, 30, 35, 51, 53, 55, 60], "flow": [16, 28], "flower": 52, "focus": [0, 30], "fold": 15, "folder": [2, 3, 19, 34, 39, 40, 61], "follow": [0, 2, 3, 7, 15, 16, 17, 18, 22, 24, 27, 28, 29, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 45, 47, 48, 51, 53, 54, 55, 56, 57, 60, 61, 62, 63], "follw": 62, "footprint": 36, "forg": [14, 56], "fork": [32, 35], "format": [7, 9, 18, 24, 28, 33, 35, 36, 61], "forth": 63, "forward": [11, 28, 54], "forward_train": 11, "found": [7, 14, 28, 29, 32, 34, 36, 39, 51], "four": 18, "fp": 47, "fp16": [16, 18, 19, 31, 44, 47, 51], "fp32": [16, 18, 19, 20, 24, 31, 44, 45, 49, 51, 52, 60], "fpn": 49, "fraction": 16, "framework": [14, 16, 30, 35, 36, 37, 40, 47, 48, 50, 51, 54, 55, 57, 60], "free": [0, 21, 29], "frequenc": [14, 31], "frequent": [4, 36], "friendli": 32, "from": [0, 3, 5, 7, 11, 16, 17, 18, 19, 21, 22, 27, 28, 29, 30, 32, 33, 35, 36, 37, 39, 43, 44, 47, 49, 50, 51, 52, 55, 56, 63], "from_logit": 35, "from_model": 49, "from_tensor_slic": 28, "frontend": [4, 16, 21, 23], "frozen": 19, "fr\u00e9chet": 54, "full": [7, 39, 40, 42], "fulli": [4, 19, 21, 30, 35], "function": [5, 17, 20, 21, 23, 25, 26, 28, 30, 32, 33], "fundament": 16, "further": [4, 16, 21], "fuse": [4, 16, 18, 19, 21, 24, 26, 51], "fusedaccmatmul": 24, "fusedbatchnorm": 24, "fusedbatchnormgrad": 24, "fusedmatmul": 24, "fusion": [4, 9, 17, 18, 19, 21, 26, 33], "fwd_desc": 11, "fwd_pd": 11, "fwd_primit": 11, "fwd_primitive_arg": 11, "g": [5, 17, 28, 40, 56, 61], "g10": [39, 40], "g11": [39, 40], "gamma_constraint": [25, 26], "gamma_initi": [25, 26], "gamma_regular": [25, 26], "gate": 25, "gaussian": 25, "gb": 31, "gbs1": 51, "gbs2": 51, "gcc": [33, 39], "gd": 35, "gddr6": 31, "gelu": [11, 33], "gelu_erf": 24, "gelu_tanh": 24, "geluop": 11, "gen": 31, "gen9": 11, "gender": 0, "gener": [4, 5, 16, 20, 21, 23, 28, 29, 30, 31, 32, 34, 38, 39, 41, 47, 49, 52], "get": [2, 4, 7, 11, 13, 21, 28, 31, 32, 33, 34, 35, 37, 39, 40, 47, 48, 51, 54, 55, 57, 60, 63], "get_concrete_funct": 35, "get_config": 35, "get_scaled_loss": 28, "get_unscaled_gradi": 28, "get_weight": 28, "getattr": 11, "getsitepackag": [37, 38, 42, 63], "gh": 5, "ghz": 31, "gigabit": 31, "gin": 58, "git": [5, 11, 16, 33, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 61, 62], "git_vers": [33, 38], "github": [5, 7, 8, 16, 21, 32, 34, 39, 40, 45, 47, 51, 54, 55, 57, 58, 60, 61, 62, 63], "give": [0, 35], "given": [17, 25, 29, 55], "glibcxx": 14, "glibcxx_3": 14, "global": [17, 28, 33, 62], "glorot_uniform": [25, 26], "glue_dataset": 16, "glue_dir": 16, "go": [7, 40, 41, 42], "go1": 7, "golang": 7, "gold": 31, "gomp": 32, "gomp_cpu_affin": 32, "good": [4, 19, 21, 23, 32, 34, 36], "googl": [7, 14, 16, 21, 22, 34, 57], "google_pretrained_weight": 51, "googleapi": [28, 35, 47, 49, 56], "govern": 63, "governor": 31, "gperftool": 32, "gpg": [37, 39], "gpu": [3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 25, 27, 28, 33, 34, 38, 43, 44, 49, 63], "gpu_kernel": 11, "gpu_profil": 28, "gpudevic": 11, "gracefulli": 0, "grad": 28, "gradient": 28, "gradienttap": 28, "granular": [29, 32, 35], "graph": [4, 9, 10, 13, 15, 16, 18, 20, 23, 30, 35, 36, 44, 53, 62, 63], "graph_def": 35, "graph_opt": [17, 18, 19, 33, 47, 52, 62], "graph_pb2": 35, "graphdef": [17, 18, 35], "graphic": [37, 39, 40], "graphopt": [17, 18, 19, 47, 62], "grappler": [15, 17, 19, 58], "greater": [24, 32], "greaterequ": 24, "greatli": 28, "green": 15, "grep": 52, "group": [25, 32], "gt": [18, 33, 62], "guarante": 37, "guid": [4, 9, 11, 18, 21, 28, 31, 34, 37, 39, 40, 42, 44, 45, 52, 63], "guidelin": [1, 4, 16, 50, 63], "guidlin": 31, "gxx_linux": [14, 56], "gz": [7, 32, 49], "h": [7, 11, 14, 17, 34, 40], "ha": [2, 3, 4, 14, 18, 19, 20, 28, 30, 32, 36, 37, 40, 51, 62], "had": [28, 32], "half": [11, 28], "halv": 28, "hand": 16, "handl": [1, 13], "handwrit": [44, 45], "happen": [28, 36, 56], "harass": 0, "hard": [2, 54], "hardwar": [4, 16, 17, 19, 21, 23, 25, 29, 33, 35, 44], "harm": 0, "hasattr": [11, 33], "hasn": 54, "hat": 42, "have": [0, 18, 28, 32, 37, 38, 39, 42, 45, 49, 52], "hbm2e": 31, "hdr": [11, 34], "he": 25, "he_norm": 35, "header": 11, "headless": 60, "healthi": 0, "heap": 32, "help": [14, 19, 20, 21, 29, 32, 39, 40, 45, 52], "here": [8, 11, 14, 17, 18, 24, 27, 30, 35, 36, 39, 40, 49, 51, 54, 55, 60, 62], "heterogen": [17, 63], "heurist": 17, "high": [14, 16, 17, 28, 32, 63], "higher": [14, 15, 20, 28, 32], "highli": 28, "histori": [19, 28], "hlo": 16, "hochreit": 25, "hold": 32, "home": [7, 29, 37, 41, 42, 56], "homogen": 17, "hook": 17, "horovod": [2, 31, 37, 38, 42, 44, 51, 60], "horovodversionmismatcherror": 51, "host": [2, 3, 28, 39, 42, 47], "hour": 31, "how": [1, 5, 14, 17, 18, 27, 32, 34, 39, 40, 42, 44, 49, 58, 61, 63], "howev": [18, 21, 24, 28, 29, 30, 32, 54], "hpp": 11, "hs_to_tfg": 17, "hsp": 17, "html": [0, 5, 39, 42], "http": [0, 2, 5, 7, 8, 16, 21, 22, 28, 32, 34, 35, 37, 38, 39, 40, 41, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "http_proxi": [2, 3], "https_proxi": [2, 3], "hub": 34, "hurt": 33, "hutter": 25, "hvd": 51, "hvd_configur": 61, "hvd_support": 61, "hyper": [29, 31, 32], "hyperparamet": 51, "hyphen": 32, "i": [0, 4, 5, 7, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "i0203": 61, "i0324": 62, "i0817": 61, "i1015": 51, "i1021": 51, "i1022": 51, "icd": [37, 42], "id": [2, 30, 34], "idea": 32, "ident": [0, 28], "identif": 28, "identifi": 39, "if_not_mobil": 34, "igc": 37, "ignor": [18, 28, 34], "ii": [18, 19, 33], "iii": [18, 19], "illustr": 32, "ilov": 25, "imag": [27, 28, 35, 41, 42, 44, 49, 54], "image_classif": [61, 62], "image_nam": [2, 3], "imagenet": 22, "imageri": 0, "img_arrays_for_acc": 54, "impact": [0, 5, 14, 18, 24, 32, 56], "implement": [4, 7, 10, 16, 17, 19, 21, 23, 25, 26, 30, 32, 35, 49, 51, 63], "import": [2, 7, 11, 14, 17, 18, 19, 22, 23, 25, 26, 27, 28, 30, 32, 35, 37, 38, 39, 40, 41, 42, 47, 49, 52, 53, 56, 63], "import_graph_def": 35, "imports_graph_def": 35, "improv": [15, 16, 19, 28, 32, 36, 39, 40, 49, 62], "inappropri": 0, "incarn": 2, "incept": [15, 18, 35, 44, 49, 54], "inceptionv4": 35, "inceptionv4_fp32_pretrained_model": [35, 47], "incid": 0, "includ": [0, 7, 13, 14, 16, 17, 18, 20, 23, 40, 42, 51, 52, 53, 63], "include_subdir": 7, "inclus": 0, "incorrect": 28, "increas": [18, 28, 52], "independ": [16, 25, 29, 35], "index": [18, 32], "indic": [24, 28, 47, 62], "individu": [0, 16, 20], "inf": 28, "infer": [11, 15, 16, 17, 18, 19, 24, 28, 34, 36, 44, 45, 51, 52, 56], "infer_config": 52, "infer_fp32_vs_amp": 47, "infer_inception_v4_amp": 47, "infer_resnet50": [29, 48], "inferlist": 18, "inferlist_add": 18, "inferlist_remov": [18, 19], "infin": 28, "influenc": [21, 29, 32], "info": [17, 18, 29, 36, 40, 45, 47, 49], "inform": [0, 1, 7, 8, 16, 20, 29, 32, 33, 39, 40, 42, 45, 52, 61, 63], "infrastructur": [4, 9, 20, 63], "init": 11, "init_checkpoint": 57, "initi": [17, 20, 28, 31, 35, 39, 40], "initial_weight": 28, "innov": [4, 63], "inplac": 7, "input": [4, 11, 13, 17, 19, 20, 21, 22, 24, 25, 28, 33, 35, 62], "input_height": 53, "input_shap": [35, 49], "input_width": 53, "input_x": 35, "insert": [18, 19, 24, 35, 52], "insid": [2, 63], "inspir": 0, "instal": [2, 3, 4, 7, 9, 14, 18, 19, 21, 22, 23, 26, 27, 28, 29, 31, 32, 33, 45, 46, 47, 48, 51, 52, 54, 55, 56, 57, 60], "install_head": 40, "instanc": [0, 31], "instance_idx": 29, "instancenorm": [19, 26], "instead": [36, 37, 39, 51, 54, 55, 60], "instruct": [2, 3, 4, 7, 16, 18, 19, 21, 31, 32, 41, 42, 54, 61, 63], "insult": 0, "int": [11, 35, 40, 51], "int8": [4, 28, 31, 45, 49, 52], "integ": 29, "integr": [4, 15, 16, 30, 32, 39], "intel": [0, 1, 5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 36, 38, 43, 44], "intel_extension_for_tensorflow": [11, 17, 18, 19, 25, 26, 28, 29, 34, 37, 38, 39, 41, 42, 47, 49, 63], "intel_extension_for_tensorflow_lib": [11, 39], "intel_xpu": 2, "intelai": 16, "intelpython3_ful": 38, "intend": [7, 16, 63], "intent": 7, "inter": [4, 20, 35], "inter_op_parallelism_thread": 35, "interact": [0, 39], "interfac": [17, 30, 43, 63], "intermedi": [16, 28], "intern": 16, "internet": 47, "interop": 29, "interpret": 29, "intraop": 29, "introduc": [16, 29, 32, 36], "introduct": 19, "invalid": [13, 27, 32], "invent": 15, "investig": [0, 29], "invis": 0, "invok": [16, 17], "involv": 0, "io": [5, 34], "ip": 56, "ipc": [2, 3, 42, 47], "ipp": 55, "ipykernel": 54, "ipynb": [52, 54, 56], "ipython": 56, "ir": [16, 17], "irc_na": [37, 42], "is_bf16_math_mod": 24, "is_gpu_avail": 28, "isol": [37, 41, 42], "issu": [0, 1, 4, 7, 14, 18, 28, 37, 39, 40, 42, 56, 63], "item": [22, 35], "iter": [20, 31, 35, 36, 62], "itex": [0, 2, 3, 4, 8, 9, 11, 13, 14, 17, 18, 19, 20, 21, 23, 26, 27, 28, 29, 30, 31, 34, 37, 38, 39, 40, 41, 42, 46, 47, 52, 54, 62, 63], "itex_auto_mixed_precis": [16, 18, 19, 29, 33, 47], "itex_auto_mixed_precision_allowlist_add": [18, 19], "itex_auto_mixed_precision_allowlist_remov": 18, "itex_auto_mixed_precision_clearlist_add": 18, "itex_auto_mixed_precision_clearlist_remov": 18, "itex_auto_mixed_precision_data_typ": [16, 18, 19, 47], "itex_auto_mixed_precision_denylist_add": 18, "itex_auto_mixed_precision_denylist_remov": 18, "itex_auto_mixed_precision_inferlist_add": 18, "itex_auto_mixed_precision_inferlist_remov": [18, 19], "itex_auto_mixed_precision_log_path": [18, 19, 20, 33], "itex_auto_mixed_precision_unsafe_force_al": 18, "itex_bf16": 61, "itex_bf16_lar": 61, "itex_build": [39, 40], "itex_cfg": [17, 62], "itex_check_eq": 11, "itex_cpp_min_log_level": 20, "itex_disable_xla": 27, "itex_dummy_bf16": 61, "itex_dummy_bf16_lar": 61, "itex_dummy_fp32": 61, "itex_dummy_fp32_lar": 61, "itex_enable_multiple_stream": 62, "itex_enable_nextpluggable_devic": 27, "itex_fp32": 61, "itex_fp32_lar": 61, "itex_fp32_math_mod": [20, 51], "itex_gpu_wrapp": 42, "itex_layout_opt": [29, 32, 33], "itex_layout_optitex_remapperitex_auto_mixed_precisionitex_shard": 33, "itex_omp_threadpool": [3, 4, 20, 29, 35, 40], "itex_onednn_graph": [33, 52], "itex_ops_overrid": 27, "itex_optimizer_after_shard": 17, "itex_optimizer_before_shard": 17, "itex_quant": 49, "itex_remapp": 33, "itex_repo": 47, "itex_shard": 33, "itex_sync_exec": 33, "itex_tf_constant_fold": [15, 52], "itex_tile_as_devic": 20, "itex_verbos": [11, 17], "itex_vlog": 11, "itex_xpu_librari": 11, "itex_xx": 61, "itexauto_mixed_precision_opt": [18, 19], "itexdatatyp": 33, "itexgelu": 26, "itexgelugrad": 26, "itexlayernorm": 26, "itexlayernormgrad": 26, "itexlstm": 26, "itexresourceapplyadamwithweightdecai": 26, "itexrnn": 26, "its": [4, 11, 25, 28, 29, 30, 32, 37, 42, 53], "iv": [18, 19], "jammi": [37, 39], "jax": [16, 27, 30, 63], "jemalloc": 32, "jit": [4, 16, 27, 30], "jit_compil": 27, "job": [11, 20, 40], "join": [22, 32, 35], "json": [16, 35, 57], "just": [0, 4], "k8": [3, 40], "kaim": 25, "kdstindex": 11, "keep": [28, 32], "keepdim": 35, "kei": [9, 17, 20, 36, 37, 39], "kept": [26, 28], "kera": [4, 19, 25, 26, 31, 35, 51, 52, 54, 58, 63], "keras_util": [61, 62], "kerascv": 31, "keraslay": 22, "kernel": [2, 3, 9, 10, 15, 20, 22, 23, 24, 25, 28, 30, 31, 35, 37, 39, 40, 41, 42, 51, 52, 54, 56, 63], "kernel_initi": [25, 26], "kernels_experiment": 34, "keyr": 37, "kind": [0, 4, 21, 53], "kitti": 49, "kmp": 32, "kmp_affin": [29, 32, 35], "kmp_blocktim": [29, 32, 35], "knob": 29, "know": [19, 28], "knowledg": [19, 32], "known": [16, 28, 56], "kwarg": [25, 26, 35], "l": [34, 35, 40], "l28": 34, "l2loss": 24, "l_basekit_p_2024": [37, 42], "label_shap": 49, "ladder": 0, "lake": [4, 21], "lamb": [25, 51], "lambda": 25, "languag": [0, 40], "language_model": 16, "languagemodel": 51, "laptop": 14, "lar": 61, "larg": [4, 16, 20, 25, 28, 32, 35, 36, 44], "larger": [31, 32, 35, 39, 40], "last": [28, 56], "latenc": [13, 35, 47, 54], "latency_mod": 29, "later": [32, 37, 41, 42], "latest": [8, 27, 31, 34, 38, 39, 40, 42, 63], "launch": [21, 42, 54], "launcher": [4, 29, 32], "layer": [2, 9, 16, 19, 25, 28, 35, 52], "layer_0": 20, "layernorm": [19, 24, 26], "layernormgrad": 26, "layout": [13, 29, 33, 36], "layout_opt": 33, "ld": 32, "ld_library_path": 40, "ld_preload": [29, 32], "lead": [0, 16, 18], "leader": 0, "leakyrelu": 24, "learn": [0, 14, 15, 16, 19, 21, 25, 27, 29, 32, 34, 36, 44, 45, 63], "learning_r": [25, 26, 57], "learning_rate_per_gpu": 51, "learning_rate_phase1": 51, "learning_rate_phase2": 51, "least": [28, 37, 38], "leav": 32, "legaci": [27, 30, 51, 54, 55, 56, 57, 60, 61, 62], "legal": 7, "len": 35, "length": [16, 31, 51], "less": [4, 18, 19, 21, 24, 28, 35, 47], "lessequ": 24, "let": [18, 28, 34, 35], "level": [0, 14, 16, 17, 23, 24, 28, 37], "level_zero": 14, "level_zero_util": 14, "leverag": [4, 16], "lib": [2, 14, 29, 39, 40, 56], "lib64": 29, "lib_path": 40, "libgomp": 32, "libiari": 42, "libigc1": 37, "libigdfcl1": 37, "libigdgmm12": 37, "libiomp": 32, "libiomp5": [32, 40], "libitex": 40, "libitex_common": 39, "libitex_cpu": 39, "libitex_cpu_cc": [34, 40], "libitex_gpu": 39, "libitex_gpu_cc": [34, 40], "libitex_gpu_xetla": 40, "libmkl_sycl": [14, 47, 48, 51, 54, 55, 57, 60], "libomp": 39, "librari": [2, 3, 11, 14, 16, 29, 32, 37, 39, 42, 55], "library_path": 40, "libtensorflow": 40, "libtensorflow_cc": 40, "libtensorflow_framework": 40, "like": [0, 2, 7, 17, 25, 28, 32, 33, 46, 47, 57, 58], "limit": [16, 17, 32, 63], "line": [7, 28, 32, 34, 47, 56, 62], "linear": [4, 16, 19, 21, 25, 28, 30], "linearli": 25, "link": [2, 31, 40, 52], "linkstat": 11, "linux": [2, 3, 7, 29, 31, 32, 38, 39, 40, 41, 42, 52], "list": [2, 7, 11, 16, 19, 24, 27, 28, 29, 30, 32, 35, 37, 39, 40], "list_local_devic": 2, "list_physical_devic": [14, 19, 28], "littl": 18, "live": 16, "ll": [20, 24], "lld": 39, "lldb": 39, "llga": [7, 33], "llvm": [16, 39], "llvm_openmp": 40, "ln": 40, "load": [11, 28, 34, 35, 42], "load_data": [19, 28, 35], "load_ops_librari": 11, "load_pb": 35, "load_ref_result": 54, "local": [2, 3, 7, 14, 19, 29, 31, 32, 34, 35, 39, 40, 41, 42, 49, 58], "localalloc": 29, "localhost": [5, 11, 20, 41, 42], "locat": [7, 8, 39, 40, 51, 54], "lock": 13, "log": [7, 11, 18, 20, 22, 28, 33, 35, 40, 42, 47, 48, 51, 54, 55, 56, 57, 58, 60, 62], "log_everi": [55, 60], "log_file_prefix": 29, "log_path": 29, "log_step": 62, "log_warmup_step": 60, "logdir": 22, "logic": 32, "logit": 35, "logpath": 22, "long": [25, 30], "look": [2, 24, 34, 39, 40], "loop": [54, 62], "loshch": 25, "loss": [15, 18, 19, 31, 35, 44, 45, 52, 58], "loss_object": 28, "loss_scal": 28, "lossscaleoptim": 28, "low": [4, 16, 18, 21, 23, 28, 45], "lower": [4, 15, 18, 19, 21, 35, 47], "lowpropos": 49, "lr": [25, 51, 58], "lscpu": [32, 52], "lstm": 25, "lt": [31, 33, 37], "ltensorflow_cc": 40, "ltensorflow_framework": 40, "m": [5, 29, 32, 45, 46, 49, 54, 55, 58, 60], "m150": [39, 40], "m75": [39, 40], "machin": [2, 3, 14, 16, 21, 28, 29, 32, 34, 41, 42, 53, 58], "macro": 11, "made": [11, 30, 55], "mai": [0, 7, 13, 14, 16, 18, 19, 24, 28, 29, 32, 35, 36, 37, 38, 42, 54, 63], "mail": 0, "main": [5, 17, 21, 37, 39, 40, 55, 58, 60, 61], "mainli": [15, 17, 29], "maintain": [0, 7, 8, 14, 18, 21, 23, 25, 34, 36], "make": [0, 2, 3, 5, 7, 11, 16, 18, 19, 28, 30, 32, 35, 36, 39, 40, 47], "makefil": 40, "malloc": [29, 32], "malloc_conf": 29, "man": 32, "manag": 63, "mani": [16, 18, 21, 28, 29, 32, 58], "manner": 16, "manual": [5, 7, 18, 28, 29, 51, 61], "manylinux2014": [37, 41, 42], "manylinux2014_x86_64": 40, "manylinux_2_17_x86_64": 40, "map_structur": 35, "mark": 17, "mask": [25, 44], "maskrcnn": 60, "master": [32, 34, 36], "match": [16, 29, 36, 43], "matcher": 24, "math": [20, 24, 28, 37, 42], "matmul": [17, 20, 24, 26, 35, 36, 40, 49], "matrix": [36, 40], "max": [16, 33, 39, 40, 42, 47, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62, 63], "max_seq_length": 57, "max_step": 55, "maxim": [4, 17, 21, 25, 33, 62], "maximum": [31, 51], "maxpool": 49, "maxpool3d": 24, "maxval": 35, "md": 21, "mean": [13, 14, 18, 25, 27, 28, 29, 32, 35, 36, 39, 40], "mechan": [4, 16, 21, 30], "media": 0, "medic": 44, "meet": [3, 25, 51, 63], "member": [0, 33], "membind": 32, "memori": [4, 9, 11, 13, 14, 15, 16, 18, 19, 21, 25, 28, 31, 36, 47, 51], "memory_limit": 2, "mention": [28, 32], "merg": 5, "messag": [28, 29], "meta": 13, "metadata_thp": 29, "metal": 44, "method": [28, 32, 45, 52], "metric": [19, 28, 35], "middl": 28, "might": [11, 39], "migrat": 7, "millisecond": 32, "mind": 16, "miniconda": 38, "miniconda3": 38, "minim": [15, 32], "minimum": [31, 39], "minor": [4, 21, 23], "minut": [25, 39, 40], "minval": 35, "miscellan": 9, "mismatch": 28, "miss": 15, "mistak": 0, "mit": 52, "mix": [4, 31, 33, 35, 44, 49], "mixed_bfloat16": 28, "mixed_float16": 28, "mixed_precis": 28, "mkdir": [2, 3, 39, 61, 62], "mkl": [7, 34, 37, 38, 39, 40, 42], "ml": 16, "mlir": 17, "mnist": [19, 28, 34, 35, 44, 58], "mnist_client": 34, "mnist_saved_model": 34, "mode": [16, 17, 20, 24, 31, 33, 39, 51, 54, 61], "model": [2, 3, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 27, 32, 33, 35, 36, 44, 45, 52, 56, 58, 62, 63], "model_base_path": 34, "model_dir": [3, 34, 55, 60, 61, 62], "model_nam": [3, 34], "model_path": 49, "model_serv": [3, 34], "model_training_util": 51, "model_typ": 61, "modelserv": 34, "moder": 0, "modern": 36, "modif": [4, 16, 30], "modifi": [5, 35, 40, 47, 51, 62], "modul": [14, 17, 29], "modular": 10, "modulenotfounderror": 14, "monitor": 14, "monolith": 16, "more": [1, 4, 7, 11, 16, 18, 19, 21, 25, 32, 34, 35, 36, 37, 39, 40, 42, 45, 51, 52, 53, 58, 61], "most": [4, 18, 19, 28, 29, 32, 47, 56], "mount": [2, 3], "move": [18, 32, 51, 55, 60], "mozilla": 0, "mpi": [37, 38, 42], "mpirun": [55, 58, 60, 61], "mrpc": 16, "mt": 31, "much": [28, 32, 35, 52], "mul": 24, "multi": [28, 32, 33, 38, 39, 51, 60, 62], "multipl": [18, 20, 32, 36, 62], "multipli": 28, "must": [5, 15, 27, 28, 35], "mutex": 13, "mutual": 29, "my": [14, 18, 19], "mybuilddir": 39, "myfil": 7, "n": [18, 24, 25, 32, 33, 38, 39, 40, 51, 53], "n02123159": 48, "na": [27, 31], "name": [2, 3, 5, 7, 11, 14, 18, 19, 20, 25, 26, 28, 30, 32, 34, 35, 44, 49, 54, 58], "name_scop": 11, "namespac": [4, 17, 21, 23, 25, 26, 33, 40], "nan": 28, "narrow": 28, "nation": 0, "nativ": [4, 15, 16, 21], "natur": 0, "ncdhw": 24, "nchw": 32, "ncore_per_inst": 29, "ndhwc": 24, "necessari": [16, 28, 37, 41, 42, 53], "necessarili": 16, "need": [4, 8, 13, 14, 16, 17, 20, 21, 23, 28, 29, 30, 34, 35, 36, 37, 38, 39, 40, 42, 47, 52, 53, 56, 60, 61, 62], "neg": [32, 35], "neglig": 28, "neither": 29, "nest": 35, "netron": 18, "network": [14, 15, 32], "neural": [4, 14, 15, 21, 32, 44, 45, 52], "new": [4, 5, 7, 8, 15, 16, 21, 23, 24, 28, 30, 32, 36, 45, 51], "newer": [15, 45, 46, 52], "newrootscop": 40, "next": [4, 16, 28, 39, 49], "next_pluggable_devic": 30, "next_pluggable_device_factori": 30, "nextplugg": 30, "nextpluggabledevic": 16, "nhwc": [20, 32], "nibabel": 55, "nic": 31, "nice": 32, "nifti": 55, "nightli": 55, "ninstanc": 29, "nn": [11, 25, 26, 33, 35, 53], "nn_op": 11, "no_proxi": [2, 3], "no_python": 29, "node": [13, 18, 20, 24, 32, 36, 38, 45, 51], "node0": 32, "node1": 32, "node_id": 29, "nolint": 7, "nolintnextlin": 7, "non": [27, 35], "none": [8, 25, 26, 28, 29, 33, 51], "nonetyp": 56, "nonlinear": 25, "nor": 29, "norm": 25, "normal": [17, 20, 25, 28, 32, 39, 47], "note": [2, 3, 5, 11, 16, 17, 18, 20, 25, 27, 28, 29, 31, 33, 34, 36, 39, 40, 47, 49, 51, 54, 58, 60, 61], "notequ": 24, "notfounderror": [14, 47, 48, 51, 54, 55, 57, 60], "noth": 11, "notic": [13, 28], "novel": 16, "now": [2, 18, 28, 32, 34], "np": [22, 25, 53, 55, 58, 60, 61], "npd": [4, 27, 30], "npz": 28, "nth": 32, "nullptr": 11, "num": [29, 32, 51], "num_accumulation_steps_phase1": 51, "num_accumulation_steps_phase2": 51, "num_channel": 53, "num_class": 35, "num_el": 11, "num_gpu": [51, 62], "num_test": 34, "num_train_epoch": 57, "num_unit": [19, 28], "numa": 31, "numactl": [29, 35], "number": [15, 20, 24, 28, 31, 32, 35, 36, 44, 45, 51, 54, 61, 62], "number_of_process": 61, "numer": 28, "numpi": [22, 25, 28, 53, 55], "nv_result": 54, "nvidia": [28, 51, 54, 55, 60], "nvme": 31, "o": [2, 22, 27, 31, 35, 37, 38, 39, 40, 42, 44, 52], "oam": 31, "object": [12, 14, 18, 28, 32, 33, 47, 48, 49, 51, 54, 55, 56, 57, 60], "oblig": 0, "obvious": 18, "occasionali": 27, "occupi": 18, "occur": 28, "ocl": 11, "ocloc": [39, 40], "off": [13, 29, 31, 33, 52, 62, 63], "offcial": 11, "offens": 0, "offer": [19, 30, 32, 49], "offici": [0, 16, 32, 44, 45, 46, 51, 54, 55, 57, 60, 61, 62], "offlin": [0, 36, 39, 40], "offononoffoff": 33, "often": [29, 37, 41, 42], "ok": 51, "omp": [4, 20, 32, 35], "omp_num_thread": [29, 35], "omp_proc_bind": 32, "omp_schedul": 32, "onboard": 32, "onc": [20, 28, 32, 36], "onconfig": [18, 19], "one": [11, 15, 20, 21, 28, 32, 39, 40, 47, 53, 55, 61], "oneapi": [2, 14, 21, 31, 34, 38, 45, 47, 48, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "oneapi_install_path": 34, "oneccl": [2, 37, 38, 42, 51], "onednn": [9, 11, 12, 14, 15, 20, 24, 32, 33, 36, 44], "onednn_cpu_git_vers": 33, "onednn_engin": 11, "onednn_gpu_git_vers": 33, "onednn_graph": 33, "onednn_graphoverrid": 33, "onednn_stream": 11, "onednn_verbos": 11, "onednngraph": 15, "onemkl": [37, 38, 39, 40, 42], "ones": [22, 25, 26, 33, 51], "onli": [2, 4, 5, 13, 14, 16, 17, 18, 20, 21, 23, 24, 28, 29, 30, 33, 34, 36, 37, 41, 51, 54, 55, 56, 57, 60, 61, 62], "onlin": [0, 31, 63], "op": [4, 9, 10, 16, 17, 20, 21, 23, 24, 26, 27, 28, 30, 35, 40, 49, 51, 54], "op_build": 11, "op_kernel": 11, "op_requires_ok": 11, "opaqu": 30, "open": [0, 5, 7, 14, 16, 18, 21, 34, 35, 37, 47, 48, 51, 52, 54, 55, 56, 57, 60, 63], "opencl": [14, 37, 39, 40, 42], "opencv": [49, 60], "openmp": [29, 39], "openvino": 49, "openxla": 4, "openxla_support_on_gpu": 21, "oper": [4, 13, 15, 16, 18, 23, 24, 28, 32, 35, 36, 63], "opinion": 0, "opkernel": 11, "opkernelconstruct": 11, "opkernelcontext": 11, "ops_overrid": 27, "opt": [2, 3, 11, 14, 37, 39, 40, 42, 46, 58], "optim": [2, 4, 9, 14, 15, 16, 17, 18, 23, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 60, 61, 63], "option": [2, 3, 7, 11, 18, 21, 29, 33, 35, 61, 62, 63], "order": [18, 19, 28, 29, 30, 32, 38, 43], "org": [0, 2, 7, 21, 39, 40, 49, 56], "organ": 16, "orient": 0, "origin": [4, 16, 18, 21, 23, 24, 25, 31, 36, 40, 45, 47, 49, 56], "orign": 31, "orthogon": [25, 26], "other": [0, 17, 20, 25, 28, 29, 30, 31, 32, 33, 34, 35, 37, 39, 40, 42, 56, 58, 63], "otherwis": [0, 17, 28, 33, 52, 53], "our": 29, "out": [3, 15, 28, 36, 40, 48, 51, 53, 54, 62], "outcom": 54, "outermost": 25, "output": [2, 7, 11, 13, 16, 19, 20, 24, 25, 28, 30, 31, 33, 35, 37, 39, 40, 47, 49, 52, 57], "output_dim": 35, "output_dir": [16, 55, 57, 60], "over": [18, 28, 49], "overal": [0, 32], "overhead": [13, 16, 28, 32, 35, 51], "overload": 26, "overrid": [4, 11, 18, 27, 28], "oversize_threshold": 29, "overview": 4, "own": [35, 49], "p": [2, 3, 25, 34, 41, 42, 47, 61], "pacakg": 56, "packag": [3, 27, 30, 32, 37, 38, 39, 41, 45, 51, 52, 55, 56, 60, 63], "pad": [24, 25, 53], "page": [5, 21, 22, 23, 32, 63], "paintbucket": 18, "parallel": [13, 20, 32, 35, 39], "paramet": [17, 26, 35, 47, 51], "parent": 9, "parsefromstr": 35, "part": [15, 16, 17, 32, 39, 40, 51, 60], "parti": [9, 36, 63], "particip": 0, "particular": 28, "particularli": 14, "partit": [15, 32], "pass": [11, 15, 16, 17, 28, 31, 33, 36, 49, 54, 62], "patch": [7, 34, 51, 54, 55, 57, 60, 62], "path": [2, 3, 7, 16, 18, 19, 20, 22, 29, 32, 33, 34, 37, 38, 39, 40, 42, 47, 49, 51, 52, 55, 57, 60, 61, 62], "path_to_itex": 3, "path_to_libitex_cpu_cc": 34, "path_to_libitex_gpu_cc": 34, "path_to_python_unit_test": 7, "path_to_site_packag": [37, 38, 42, 63], "path_to_tensorflow_serv": 3, "pattern": [0, 4, 15, 16, 21, 24], "pb": [18, 19, 34, 35, 47, 49], "pb_file": 35, "pbtxt": 17, "pci": [2, 30], "pcie": 31, "pdf": 25, "peak": [18, 23], "penal": 32, "peopl": 0, "per": [17, 28, 29, 31, 32, 38, 58, 62], "perf": 27, "perform": [4, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 28, 29, 32, 33, 35, 36, 39, 40, 44, 49, 51, 52, 54, 55, 60, 62, 63], "period": [0, 32], "permiss": [0, 5], "person": 0, "perspect": [29, 32], "phase": [15, 31, 36, 51], "phase1": [31, 51], "phase2": 51, "phase_2": 51, "photo": 52, "physic": [0, 30, 32, 62], "physical_devic": [14, 58], "physical_device_desc": 2, "physicaldevic": [14, 58], "pick": 7, "picker": 5, "piecewiseconstantdecai": 25, "pip": [7, 11, 14, 22, 27, 33, 34, 37, 38, 39, 40, 41, 42, 45, 46, 49, 51, 54, 55, 58, 60, 62, 63], "pip3": 41, "pip_packag": [11, 39], "pip_set_env": [51, 52, 54, 55, 57, 60, 61], "pipelin": [16, 44, 45, 52], "pjrt": [4, 16, 21, 63], "place": [4, 17, 21, 32, 40], "placement": [29, 32], "plai": 32, "plain": 36, "platform": [14, 16, 28, 32, 33, 37, 39, 40, 41, 51, 54, 55, 56, 57, 60, 61, 62], "platinum": [31, 32, 35], "pleas": [7, 11, 14, 16, 17, 21, 27, 28, 37, 39, 40, 42, 44, 45, 47, 51, 53, 55, 57, 58, 60, 61, 63], "plu": [16, 32], "plug": [34, 63], "pluggabl": [4, 10, 16, 30, 40], "pluggable_devic": 30, "pluggable_device_factori": 30, "pluggabledevic": [10, 27, 63], "plugin": [4, 10, 16, 18, 19, 21, 22, 34, 39, 58, 63], "po": 35, "point": [17, 18, 20, 28, 33, 37, 42, 47], "polici": [29, 32, 63], "polit": 0, "polymorph": 11, "pool": 4, "popular": [15, 16, 31], "port": [34, 54], "portabl": [16, 36], "posit": [0, 7], "possibl": [4, 19, 32, 35, 36, 39], "post": [0, 7, 18, 19, 24, 33], "post1": 40, "potenti": [28, 63], "power": [19, 63], "ppn": [55, 58, 60, 61], "pr": 5, "practic": [4, 28, 29], "pramet": 62, "pre": [18, 31, 33, 41, 42, 51, 56], "precis": [4, 16, 30, 31, 33, 44, 45, 49, 54, 57], "preconfigur": 39, "predict": [19, 26, 27, 28, 35, 57], "predict_batch_s": 16, "predict_fil": 57, "prefer": [29, 37, 41, 42], "prefix": 29, "preload": 32, "preop": 18, "prepack": 4, "prepend": [29, 55, 58, 60, 61], "preprocess": 60, "preprocess_data": 55, "present": [30, 54], "preserv": 20, "press": 38, "pretrain": [31, 44, 49], "pretrain_bert": 51, "pretrain_lamb": 51, "pretrain_path": 51, "pretrain_result_dir": 51, "prevent": 28, "previou": [8, 25, 32, 51], "previous": [28, 30], "primari": [17, 32], "primit": [11, 13, 20, 36], "primitive_attr": 11, "primitive_desc": 11, "principl": 18, "print": [2, 11, 19, 22, 25, 28, 29, 30, 33, 35, 37, 38, 39, 40, 41, 42, 47, 48, 51, 53, 54, 62, 63], "print_graph": 35, "printf": 51, "priorit": 18, "prioriti": [20, 33], "privaci": 0, "privat": 0, "privileg": [2, 3, 47], "problem": [14, 24, 28, 32, 56], "proc": [28, 32], "procedur": [11, 37, 41, 42], "process": [4, 7, 11, 16, 21, 28, 29, 32, 34, 51, 52], "process_per_nod": 61, "processor": [4, 21, 31, 32, 41, 47, 52, 53], "proclist": 32, "produc": 57, "product": [5, 7, 21, 34, 37], "profession": 0, "profil": [4, 9, 28, 30, 32], "profiler_demo": 22, "program": [9, 27, 32, 63], "project": [2, 5, 7, 16, 63], "prolong": [39, 40], "promot": 7, "prompt": [31, 39, 40], "promptli": 0, "prop_kind": 11, "propag": [9, 13, 16, 17], "properli": [21, 29], "properti": [17, 18, 28], "propos": [7, 25], "protect": 11, "protobuf": 52, "protocol": 49, "protocolmessag": 33, "provid": [0, 2, 4, 7, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 42, 44, 45, 49, 51, 52, 55, 60, 61, 62, 63], "proxi": 36, "prune": 35, "pseudocod": 28, "pub": 37, "public": [0, 4, 5, 11, 21, 25, 33, 34], "publish": [0, 5], "pull": [7, 34, 41, 42, 47], "pure": 31, "push": [5, 16], "put": 34, "pvc": [39, 40, 51], "pwd": [47, 62], "py": [7, 11, 16, 22, 29, 34, 35, 42, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "pybind11": 60, "pycocotool": 60, "pylint": 7, "pylintrc": 7, "pypi": [2, 43, 63], "python": [2, 4, 9, 14, 19, 22, 23, 25, 26, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 41, 42, 45, 46, 49, 51, 52, 53, 55, 56, 57, 58, 60, 61, 63], "python3": [2, 5, 16, 38, 39, 54, 56], "pythonhost": 40, "pythonpath": 61, "pytorch": [27, 30], "q1": 14, "q_model": 49, "qdq": 52, "qo": 37, "qualiti": 28, "quantiz": [4, 44], "quantizev2": 49, "queri": 28, "question": [0, 4, 36, 63], "queue": [35, 62], "quick": [4, 11, 37, 44], "quickli": [20, 28], "r": [3, 7, 14, 28, 31, 32, 44, 62], "r2": [34, 40, 62], "race": 0, "rais": 33, "rand": 53, "random": [25, 35, 53], "randomnorm": 40, "rang": [25, 28, 32, 35], "rank": [31, 55, 58, 60, 61], "rapid": [41, 47], "rare": 28, "rate": [14, 15, 18, 25, 34], "rather": 25, "ratio": 36, "raw": 58, "rb": 35, "rcfile": 7, "rcnn": 49, "re": [2, 32, 35, 46], "reach": 18, "read": [20, 28, 35, 45, 55], "readm": 61, "real": [15, 28, 36, 51, 61], "reason": [0, 28, 30], "recent": 56, "recogn": [44, 45], "recommend": [16, 20, 28, 32, 33, 34, 35, 37, 38, 39, 41, 42, 46, 52], "record": [36, 61], "recurrent_activ": [25, 26], "recurrent_initi": [25, 26], "recurs": 7, "red": 42, "reduc": [15, 16, 18, 28, 32, 36, 39, 40, 45, 51, 54, 62], "reduce_mean": 35, "ref_result_dir": 54, "refer": [2, 3, 7, 11, 14, 15, 17, 18, 19, 20, 21, 23, 28, 31, 32, 33, 34, 37, 39, 40, 42, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "refresh": 22, "regardless": 0, "region": 32, "regist": [4, 14, 30, 45, 52], "register_": 11, "register_geluop": 11, "register_kernel_build": 11, "registr": [10, 11, 55], "registrationcent": [37, 42], "regress": 27, "regular": [25, 36], "reinstal": 51, "reject": 0, "rel": [16, 29, 51], "relat": [5, 27, 29, 34, 36], "relationship": [14, 18], "releas": [4, 14, 17, 32, 33, 34, 39, 40, 45, 54, 56], "reli": 17, "relianc": 16, "religion": 0, "relu": [4, 11, 19, 21, 24, 25, 26, 28, 35, 53], "relu6": 24, "relu_op": 11, "relu_op_functor": 11, "relubaseop": 11, "relugrad": 24, "remain": [20, 30], "remapp": [19, 24, 33], "remot": 32, "remov": [0, 11, 16, 18, 24], "reorder": [13, 36], "repeat": 18, "replac": [14, 25, 26, 27, 34, 36, 40, 51], "replica": [11, 20], "repo": [5, 31, 37, 38], "report": [0, 7, 20, 63], "repositori": [9, 16, 31, 37, 51, 55, 60], "repres": [0, 4, 16, 17, 30, 31], "represent": 15, "representative_dataset": 49, "reproduc": 31, "request": [0, 7, 63], "requir": [2, 4, 7, 11, 13, 15, 16, 21, 22, 24, 25, 28, 29, 30, 36, 38, 45], "rerun": 28, "research": 57, "reserv": 32, "reset": 54, "reshap": [19, 25, 28, 35], "resnet": [61, 62], "resnet101": 49, "resnet34": 49, "resnet50": [17, 29, 31, 44, 49, 59], "resnet50_itex": 62, "resnet_ctl_imagenet_main": 62, "resnet_v1_50": 22, "resolv": 1, "resourc": [29, 32, 56], "respect": [0, 29, 35, 51], "rest": [20, 24], "rest_api_port": 34, "restart": 38, "result": [5, 15, 16, 17, 19, 22, 27, 28, 30, 32, 33, 38, 45, 48, 53, 54, 56, 62], "result_dir": 51, "retinanet50": 49, "retrain": 28, "retriev": [28, 49], "return": [11, 17, 28, 30, 33, 35, 40], "return_sequ": 25, "return_st": 25, "reus": [32, 45], "review": 0, "rewrit": [11, 17], "rewrite_opt": 52, "rewriter_config_pb2": 52, "rewriterconfig": 52, "rewritten": 16, "rf": [34, 46, 61], "rfc": [7, 21], "right": [0, 25], "rm": [34, 40, 46, 47, 61], "rmsprop": [19, 28, 35], "role": 32, "root": [7, 39, 40, 56], "rpath": 40, "rule": 19, "run": [7, 11, 14, 16, 18, 19, 22, 24, 26, 27, 28, 29, 31, 32, 33, 35, 39, 41, 42, 63], "run_20210712212258_inst": 29, "run_20210712212258_instance_0_cores_0": 29, "run_20221009103552_inst": 29, "run_20221009103552_instance_0_cores_0": 29, "run_20221009104740_inst": 29, "run_20221009104740_instance_0_cores_0": 29, "run_20221009105044_inst": 29, "run_20221009105044_instance_0_cores_12": 29, "run_20221009105320_inst": 29, "run_20221009105320_instance_0_cores_0": 29, "run_20221009105838_inst": 29, "run_20221009105838_instance_0_cores_0": 29, "run_20221009105838_instance_1_cores_12": 29, "run_20221009105838_instance_2_cores_24": 29, "run_20221009105838_instance_3_cores_36": 29, "run_20221009105838_instance_4_cores_48": 29, "run_20221009105838_instance_5_cores_60": 29, "run_20221009105838_instance_6_cores_72": 29, "run_20221009105838_instance_7_cores_84": 29, "run_20221009110327_inst": 29, "run_20221009110327_instance_0_cores_0": 29, "run_20221009110327_instance_10_cores_40": 29, "run_20221009110327_instance_11_cores_44": 29, "run_20221009110327_instance_12_cores_48": 29, "run_20221009110327_instance_13_cores_52": 29, "run_20221009110327_instance_14_cores_56": 29, "run_20221009110327_instance_15_cores_60": 29, "run_20221009110327_instance_16_cores_64": 29, "run_20221009110327_instance_17_cores_68": 29, "run_20221009110327_instance_18_cores_72": 29, "run_20221009110327_instance_19_cores_76": 29, "run_20221009110327_instance_1_cores_4": 29, "run_20221009110327_instance_20_cores_80": 29, "run_20221009110327_instance_21_cores_84": 29, "run_20221009110327_instance_22_cores_88": 29, "run_20221009110327_instance_23_cores_92": 29, "run_20221009110327_instance_2_cores_8": 29, "run_20221009110327_instance_3_cores_12": 29, "run_20221009110327_instance_4_cores_16": 29, "run_20221009110327_instance_5_cores_20": 29, "run_20221009110327_instance_6_cores_24": 29, "run_20221009110327_instance_7_cores_28": 29, "run_20221009110327_instance_8_cores_32": 29, "run_20221009110327_instance_9_cores_36": 29, "run_20221009110849_inst": 29, "run_20221009110849_instance_0_cores_0": 29, "run_20221009110849_instance_1_cores_11": 29, "run_20221009110849_instance_1_cores_24": 29, "run_20221009110849_instance_2_cores_22": 29, "run_20221009110849_instance_2_cores_48": 29, "run_20221009110849_instance_3_cores_33": 29, "run_20221009110849_instance_3_cores_72": 29, "run_20221009111034_instance_0_cores_0": 29, "run_20221009111239_instance_0_cores_24": 29, "run_20221009111753_inst": 29, "run_20221009111753_instance_0_cores_0": 29, "run_20221009111951_inst": 29, "run_20221009111951_instance_0_cores_0": 29, "run_20221009112720_instance_0_cores_0": 29, "run_20221009112905_instance_0_cores_0": 29, "run_20221009112956_instance_0_cores_0": 29, "run_classifi": 16, "run_inf": 35, "run_jupyt": 52, "run_pretraining_lamb": 51, "run_squad": [51, 57], "runner": 61, "runtim": [16, 18, 23, 25, 27, 28, 32, 36, 37, 39, 40, 51, 63], "safe": [13, 18, 33, 63], "sai": [28, 51], "same": [5, 7, 14, 20, 21, 23, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 39, 40, 45, 53], "sampl": [2, 22, 31, 35, 45, 52, 54], "samsung": 31, "saniti": [7, 63], "sapphir": [41, 47], "satisfi": [13, 23], "save": [5, 11, 17, 29, 33, 49, 57], "save_checkpoint_step": 51, "save_json_data": 35, "saved_model": 34, "savedmodel": 49, "scalabl": [4, 21, 31, 34, 41, 47], "scale": [4, 25, 26, 31, 35, 62], "scaled_gradi": 28, "scaled_loss": 28, "scenario": [4, 13, 20, 21, 23, 32, 33], "schedul": [13, 16, 25, 29, 32, 35], "schmidhub": 25, "scope": [17, 40], "scratch": [28, 51], "scratchpad": [11, 13], "scratchpad_mem": 11, "scratchpad_mod": 11, "screen": 47, "script": [5, 21, 22, 27, 32, 39, 40, 42, 47, 49, 51, 53, 55, 56, 60, 61], "sdp": 29, "seamless": [4, 30], "search": [7, 29], "sec": [31, 35, 51, 62], "second": [32, 35, 52, 61, 62], "section": [14, 28, 32, 37, 39, 40, 49], "secur": 0, "see": [0, 1, 2, 4, 7, 14, 16, 22, 25, 28, 29, 32, 34, 36, 37, 39, 52, 61, 63], "seed": 60, "seen": 32, "segment": [31, 44, 60], "select": [14, 28, 29, 30, 33, 54, 63], "self": 35, "semant": [17, 20, 25], "send": 16, "separ": [11, 14, 23, 24, 28, 31, 32, 38, 39, 63], "seq": 16, "sequenc": [31, 51, 54], "sequenti": 35, "seri": [0, 16, 32, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "serial": 35, "seriesintel": 47, "seriesne": 47, "seriessupport": 47, "seriou": 0, "serv": [4, 30], "serval": 27, "server": [5, 31, 39, 40, 42], "servic": 55, "serving_plugin": 34, "session": [40, 52], "set": [0, 2, 4, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 27, 31, 32, 33, 35, 37, 38, 40, 42, 47, 51, 52, 57, 63], "set_config": [17, 18, 19, 47, 62], "set_env_cpu": [47, 48, 56], "set_env_gpu": [47, 48, 56], "set_global_polici": 28, "set_log_device_plac": 22, "set_scratchpad_mod": 11, "set_sess": 52, "set_weight": 28, "setup": [38, 41, 43, 45], "setvar": [14, 37, 42, 46, 58], "sever": [4, 16, 21, 29, 31, 32, 39, 40, 44, 61], "sex": 0, "sexual": 0, "sh": [2, 3, 5, 14, 34, 37, 38, 39, 40, 42, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 63], "shape": [11, 13, 16, 17, 19, 25, 28, 30, 35, 36, 53], "shard": [4, 17, 21, 33], "sharding_config": [17, 62], "shardingconfig": [17, 62], "share": [7, 14, 32, 37, 47, 48, 51, 54, 55, 57, 60], "short": [16, 25, 28], "shoul": 40, "should": [2, 3, 5, 7, 22, 27, 28, 32, 34, 35, 37, 38, 40, 41, 42, 45, 51, 57, 62], "show": [5, 14, 16, 18, 27, 28, 31, 35, 39, 40, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "showcas": [16, 31], "shown": [2, 3, 15, 22, 24, 29, 51, 54, 55, 60], "shuffl": 28, "sigmoid": [24, 25, 26], "sign": [25, 37], "signific": [4, 7, 18], "significantli": [4, 28], "signoff": 51, "similar": [19, 32], "simpl": [4, 21, 23, 28, 40], "simpli": [28, 30, 62], "simplifi": 45, "simultan": [31, 42], "sinc": [4, 14, 28, 32, 36, 42], "singl": [0, 4, 7, 15, 20, 21, 24, 31, 51, 60, 61], "single_l2_loss_op": 62, "site": [5, 8, 37, 38, 39, 42, 56, 63], "situat": [20, 33], "size": [0, 20, 25, 28, 29, 31, 51, 58, 62], "skip": [7, 28, 29, 38], "skip_cross_node_cor": 29, "skip_ev": 62, "sle": 42, "sleep": 32, "slowdown": 16, "slower": [18, 19, 28, 35], "slowli": 28, "small": [13, 25, 28, 29, 32, 35], "sn850x": 31, "snapshot": 39, "snippet": 61, "so": [14, 16, 19, 28, 29, 32, 33, 34, 39, 40, 47, 48, 51, 54, 55, 56, 57, 58, 60], "social": 0, "socio": 0, "socket": [31, 32, 38, 62], "softmax": [18, 19, 28], "softwar": [2, 16, 38, 43, 45, 52, 53, 58], "sole": 32, "solut": [4, 14, 15, 21, 27, 30], "solv": [28, 56], "some": [2, 11, 18, 19, 26, 28, 29, 32, 39, 40, 49, 51, 58], "sometim": 7, "sort": [0, 16], "sourc": [2, 3, 4, 7, 11, 16, 17, 21, 37, 38, 42, 43, 46, 47, 48, 52, 55, 56, 58, 60, 63], "sp4": [31, 42], "sp5": 42, "space": [0, 32, 63], "sparse_categorical_crossentropi": [19, 28], "sparsecategoricalaccuraci": [28, 35], "sparsecategoricalcrossentropi": [28, 35], "special": [16, 19, 23, 28, 39, 40], "specif": [4, 16, 28, 30, 32, 33, 34, 37, 42, 61, 63], "specifi": [0, 3, 11, 21, 24, 28, 29, 32, 34, 39, 40, 49], "sped": 28, "speed": [15, 16, 18, 32, 44, 45], "speedup": [16, 31, 52, 62], "spend": 28, "split": [17, 18, 35], "squad": [31, 51, 57], "squad_dir": 57, "squad_vers": 51, "src": [7, 11, 14, 17, 34, 39], "src_md": 11, "src_mem": 11, "src_tensor": 11, "ssd": [31, 49], "ssdsc2kg960g8": 31, "st": [3, 40], "stabil": [19, 28], "stabl": [25, 28, 44, 63], "stable_diffusion_accuraci": 54, "stable_diffusion_infer": 54, "stable_diffussion_infer": 54, "stablehlo": 16, "stack": [31, 42, 43], "stage": [16, 52], "stage_num": [17, 62], "stall": 32, "standard": [7, 25], "standard_op": 40, "start": [2, 3, 14, 21, 22, 28, 29, 34, 35, 63], "startup": [39, 40], "stat": 22, "static": 32, "statist": 49, "statu": [0, 11, 19, 40], "status_msg": 40, "statusuniqueptr": 11, "std": [11, 40], "stdout": [7, 29], "steal": 35, "step": [3, 16, 17, 18, 25, 28, 31, 32, 34, 36, 44, 45, 51, 55, 58, 60, 62], "steps_per_epoch": [35, 60], "steps_per_loop": 62, "still": 28, "stock": [14, 16, 23, 24, 28, 30, 37, 38, 41, 42, 45, 49, 51, 54, 55, 56, 57, 60, 61, 62, 63], "stop": [22, 32], "storag": [16, 28, 31, 35, 47, 49, 56], "store": 36, "strategi": 32, "stream": [13, 27, 54, 62], "stream_executor": 28, "streamexecutor": [10, 30], "streamlin": [4, 21, 34], "strictli": 25, "stride": 53, "string": [18, 28, 29, 39, 40], "stringop": 34, "strong": 18, "structur": [4, 19, 29, 32], "sub": [9, 14, 18, 19, 32, 33], "subgraph": [15, 16], "submit": [5, 7, 63], "subsequ": [18, 19, 28, 32, 54], "subystem": 37, "succe": 36, "success": [48, 53, 54, 62], "successfulli": [14, 34, 38, 39, 40, 42, 62], "sudo": [7, 34, 37, 39, 40, 42], "suffici": [28, 35], "suggest": [56, 62], "sum": 35, "summari": [51, 63], "super": 35, "suppli": 35, "support": [4, 7, 13, 14, 15, 16, 17, 18, 19, 22, 24, 27, 28, 29, 30, 32, 33, 37, 39, 40, 41, 42, 45, 47, 52, 61, 62], "suppos": [32, 51], "sure": [3, 11, 28, 35, 37, 39, 40], "suse": [31, 42], "sustain": 0, "sw": 37, "swish": [19, 24], "switch": [4, 5, 27, 32, 35, 39], "sy": 53, "sycl": 14, "sycl_runtim": [14, 28], "symbol": 40, "sync": 33, "system": [14, 21, 30, 31, 32, 34, 35, 38, 39, 40, 56], "t": [2, 5, 11, 13, 17, 18, 20, 28, 29, 31, 36, 49, 54, 56], "tab": 22, "tabl": [18, 28, 29, 30, 31, 49], "tag": 5, "take": [0, 11, 16, 24, 28, 29, 32, 34, 35, 38, 51], "tanh": [24, 25, 26], "tape": 28, "tar": [3, 7, 32, 49], "target": [3, 16, 17, 39, 40], "task": [11, 20, 32, 61], "task_nam": 16, "taskset": 29, "tbb": 42, "tdp": 31, "team": [7, 54], "techniqu": [15, 28], "technologi": [16, 45], "tee": [29, 37, 51, 62], "tell": 14, "templat": 11, "temporari": 13, "tensor": [11, 16, 25, 28, 30, 40, 53], "tensorboard": [22, 63], "tensorflow": [5, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "tensorflow2": [51, 58, 60], "tensorflow2_keras_mnist": 58, "tensorflow_doc": 56, "tensorflow_hub": 22, "tensorflow_model_serv": [3, 34], "tensorflow_plugin": 34, "tensorflow_serv": [3, 34], "tensorflow_src": 40, "term": [0, 25, 30, 63], "termin": 38, "test": [9, 19, 22, 28, 34, 35, 38, 44, 55, 56], "test_accuraci": 28, "test_dataset": 28, "test_func": 28, "test_scor": [19, 28], "test_step": 28, "text": [18, 31, 44], "text2imag": [31, 44], "tf": [11, 14, 15, 19, 22, 25, 26, 27, 28, 29, 30, 33, 35, 37, 39, 40, 41, 42, 51, 52, 53, 62], "tf2": [49, 51, 56], "tf32": [20, 31, 51], "tf_auto_jit_flag": 27, "tf_auto_mixed_precision_graph_rewrite_allowlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_allowlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_add": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_level": 18, "tf_auto_mixed_precision_graph_rewrite_log_path": 18, "tf_bert_finetune_": 51, "tf_bert_pretraining_lamb_": 51, "tf_check_ok": 40, "tf_code": 40, "tf_compatible_vers": 33, "tf_copt": [11, 34], "tf_cpp_max_vlog_level": 20, "tf_cpp_min_log_level": 20, "tf_cuda_librari": 34, "tf_enable_onednn_opt": 29, "tf_getcod": [11, 40], "tf_hub": 22, "tf_include_path": 40, "tf_kera": 27, "tf_loadpluggabledevicelibrari": 40, "tf_messag": 40, "tf_newopdefinitionbuild": 11, "tf_newstatu": [11, 40], "tf_num_interop_thread": 62, "tf_num_intraop_thread": 62, "tf_ok": [11, 40], "tf_opdefinitionbuild": 11, "tf_opdefinitionbuilderaddattr": 11, "tf_opdefinitionbuilderaddinput": 11, "tf_opdefinitionbuilderaddoutput": 11, "tf_opdefinitionbuildersetshapeinferencefunct": 11, "tf_registeropdefinit": 11, "tf_serv": 34, "tf_statu": 40, "tf_use_legacy_kera": [27, 51, 54], "tf_ver": 2, "tf_xla_auto_jit": [16, 27, 30], "tf_xla_flag": [16, 27, 30], "tf_xla_use_device_api": [16, 30], "tfa": [25, 26, 55], "tfcc_path": 40, "tfd": 61, "tfg": 17, "tfg_optimizer_hook": 62, "tfg_to_h": 17, "tfhub": 22, "tfrecord": [51, 55, 61], "tfx": 21, "than": [19, 25, 28, 32, 35, 37, 42, 47, 53, 58], "thei": [0, 18, 28, 29, 32], "them": [16, 18, 21, 28, 29, 32, 34, 56, 61], "therefor": [28, 32], "thereof": 16, "thi": [0, 2, 3, 4, 5, 11, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 45, 46, 49, 50, 51, 52, 53, 55, 57, 60, 62, 63], "thing": 21, "think": 28, "third": [9, 36, 63], "third_parti": [7, 9, 34], "those": [0, 16, 18, 19, 34, 61], "though": 39, "thrash": 32, "thread": [4, 13, 20, 29, 31, 32, 33, 42], "threadpool": [3, 20, 40], "threaten": 0, "three": [4, 21, 22, 23, 29], "through": [0, 27, 28, 32, 35, 39, 40, 55, 63], "throughput": [31, 47, 51, 54], "throughput_mod": 29, "throughput_train": 51, "thu": 32, "tiger_cat": 48, "tightli": 30, "tile": [17, 20, 33, 51, 58, 60, 61, 62], "time": [0, 4, 11, 14, 16, 18, 19, 20, 21, 22, 28, 31, 32, 35, 39, 40, 45, 49, 51], "timehistori": [61, 62], "tip": [11, 20, 32, 34], "tmp": 34, "todai": 30, "togeth": 32, "toggl": 33, "toi": 28, "token": [54, 56], "too": [18, 28, 37, 42], "tookit": [39, 40], "tool": [7, 9, 11, 14, 18, 32, 36, 37, 38, 39, 40, 42, 63], "toolchain": 39, "toolkit": [14, 31, 37, 38, 45, 47, 58, 63], "top": 27, "topic": 4, "topologi": [21, 29, 32], "total": [31, 32, 35, 49, 51, 58], "total_loss": 51, "total_tim": 35, "total_training_step": 51, "tour": 63, "tout": 24, "toward": 0, "tpl": 7, "tpost": 24, "tpu": 49, "trace": 22, "traceback": 56, "track": [22, 56], "train": [2, 14, 17, 18, 21, 24, 25, 26, 27, 29, 34, 35, 37, 38, 42, 43, 44, 47, 51, 52, 57, 59, 63], "train_accuraci": 62, "train_and_ev": 61, "train_batch_s": [57, 60], "train_batch_size_phase1": 51, "train_batch_size_phase2": 51, "train_dataset": 28, "train_epoch": 62, "train_fil": 57, "train_horovod": 58, "train_loss": [51, 62], "train_maskrcnn": [55, 60], "train_step": [28, 51, 62], "trainabl": [25, 35], "trainable_vari": 28, "trainer": 61, "trainingop": 24, "transfer": 52, "transform": [24, 25], "translat": [0, 39, 40], "transpar": [4, 21], "transpos": [24, 26], "travers": 36, "treat": 20, "tree": [39, 40], "tri": 56, "tricki": 28, "trigger": [5, 19, 33], "troll": 0, "true": [11, 16, 22, 25, 26, 28, 29, 30, 33, 35, 40, 51, 57, 62], "truncat": 34, "try": [11, 21, 29, 45, 49, 52], "ttt": 31, "tumor": 55, "tune": [31, 33, 45, 51], "tupl": 35, "turbo": 31, "turn": [17, 63], "tutori": 56, "two": [4, 13, 14, 19, 21, 23, 28, 32, 35, 39, 47, 51, 54, 55, 60], "txt": [16, 18, 37, 42, 54, 57, 62], "type": [4, 7, 11, 14, 18, 20, 21, 29, 31, 33, 38, 39, 40, 47, 49], "type_infer": 17, "typeconstraint": 11, "typeerror": 56, "typenam": 11, "typic": [4, 21, 23, 28, 32], "u": [0, 22, 29, 42], "ubuntu": [2, 31, 34, 39, 40, 41, 42], "ubuntu22": 56, "ubuntu_vers": 2, "uma": 32, "unaccept": 0, "uncased_l": 51, "unchanged_shape_fn": 11, "undef": 11, "undefin": [2, 30], "under": [17, 23, 26, 29, 33, 39, 52], "understand": 36, "undesir": 29, "unet": [31, 44], "unet_3d_med": 55, "unexpect": 51, "unifi": [21, 29, 37], "uniform": [4, 16, 21, 30, 35], "uniniti": 17, "uninstal": [11, 51, 60], "unit": [19, 25, 28, 32, 35], "unknown": [14, 28], "unkown": 27, "unless": 33, "unmodifi": 16, "unnecessari": [24, 28, 32], "unoptim": 36, "unordered_map": 11, "unprofession": 0, "unsafe_force_al": 18, "unscal": 28, "unshard": 17, "unsolicit": 0, "unspecifi": 29, "until": [18, 32], "unwelcom": 0, "unzip": 40, "up": [18, 22, 28, 32, 37, 40, 44, 51, 54, 57], "updat": [2, 18, 27, 28, 37, 38, 39, 40, 41, 42, 62], "update_st": 28, "upenn": 55, "upgrad": [14, 37, 38, 41, 42, 45, 46, 49, 55, 60, 63], "upon": 55, "upstream": [14, 18], "url": [49, 54, 56], "us": [0, 2, 3, 4, 5, 7, 13, 14, 15, 16, 18, 19, 20, 22, 23, 24, 25, 26, 28, 31, 32, 33, 36, 37, 38, 39, 40, 42, 44, 46, 47, 49, 50, 51, 52, 53, 55, 56, 57, 60, 63], "usag": [4, 14, 16, 21, 32, 33, 35, 44], "use_bia": [25, 26], "use_default_alloc": 29, "use_itex_shard": 62, "use_logical_cor": 29, "use_mytrain": 51, "use_synthetic_data": [60, 62], "use_tf_funct": 62, "use_tf_while_loop": 62, "use_tpu": 57, "use_xla": 51, "usecyclespersecondtim": [4, 21, 22, 28], "user": [4, 5, 7, 11, 13, 19, 20, 21, 23, 27, 30, 37, 39, 40, 41, 42, 43, 47, 54, 63], "usr": [7, 29, 37, 39], "usual": 18, "ut": 7, "util": [4, 9, 11, 14, 16, 21, 23, 29, 31, 32, 35, 56, 62], "v": [2, 3, 16, 18, 34, 38, 40, 42, 46, 47], "v0": [31, 33, 38], "v1": [35, 49, 51, 52, 57, 63], "v100": 51, "v1_8": [35, 47], "v2": [15, 31, 33, 38, 42, 49, 51, 61, 63], "v3": [15, 44], "v4": [18, 35, 44], "val_accuraci": 28, "val_loss": 28, "valid": [8, 33], "validation_split": [19, 28, 35], "valu": [15, 17, 18, 20, 25, 28, 29, 31, 32, 33, 61], "valueerror": 33, "var": [2, 14, 34, 38, 39, 40, 42], "vari": 27, "variabl": [2, 4, 13, 15, 16, 19, 21, 22, 23, 24, 25, 27, 28, 30, 32, 34, 35, 38, 40, 52], "variable_dtyp": 28, "varianc": 25, "varibl": 51, "varieti": 44, "variou": 16, "ve": [39, 40], "vector": 40, "venv": [46, 55, 58, 60], "verbos": [11, 19, 20, 28, 29, 30, 35], "veri": [15, 28, 51], "verifi": [38, 39, 40, 44, 51, 54, 55, 56, 57, 60, 61, 62], "version": [0, 2, 11, 14, 16, 27, 28, 31, 32, 37, 38, 39, 40, 41, 42, 45, 46, 51, 56], "versu": [19, 32], "via": [0, 4, 11, 17, 27, 30, 31, 35, 44, 62, 63], "view": 8, "viewer": 22, "viewpoint": 0, "violat": 0, "virtual": [39, 40, 51, 52, 54, 55, 56, 57, 60, 61, 62], "virtual_env": 29, "visibl": [0, 2, 11, 34], "vision": 30, "visit": 63, "vnni": 52, "vocab": [16, 57], "vocab_fil": [16, 57], "void": 11, "volum": 55, "vulner": 63, "vz": 40, "w": [28, 31, 35, 44], "wa": [0, 29, 32, 33, 39, 40], "wai": [0, 16, 19, 28, 30, 34, 36, 38], "wait": 32, "want": [3, 5, 7, 28, 29, 37, 39, 40, 42, 51, 54, 57, 60], "warm": [22, 35], "warmup": 35, "warmup_step": 55, "warmup_steps_phase1": 51, "warmup_steps_phase2": 51, "warn": [28, 29, 40, 51], "wd": [25, 31], "wd_black": 31, "we": [0, 2, 7, 11, 24, 27, 28, 31, 32, 33, 34, 35, 38, 39, 40, 45, 46, 47, 49, 51, 52, 54, 55, 56, 57, 60, 61, 63], "weak": 31, "web": [5, 56], "websit": [45, 63], "weight": [4, 13, 25, 28, 51, 53, 62], "weight_decai": [25, 26], "welcom": [0, 7, 63], "well": [0, 2, 8, 11, 21, 26, 28, 29, 30, 31, 32, 51], "were": [0, 16, 29, 32], "wether": 27, "wget": [2, 7, 32, 35, 37, 39, 40, 42, 47, 49, 56, 58], "what": [0, 14, 28], "wheel": [2, 38, 39], "when": [0, 5, 14, 17, 19, 24, 27, 28, 29, 32, 34, 35, 36, 37, 39, 40, 51, 52, 55, 56, 60], "where": [25, 28, 31, 32, 39, 49], "wherea": 61, "wherebi": 32, "whether": [24, 29, 32], "which": [0, 4, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 24, 28, 29, 30, 32, 33, 35, 36, 37, 39, 40, 42, 45, 46, 52, 57], "while": [16, 21, 28, 31, 32, 33, 34, 39, 48, 53, 56], "whitespac": 51, "whitlei": 31, "whl": [2, 11, 39, 40, 63], "whole": [18, 20, 33, 51], "whole_seq_output": 25, "whose": 18, "why": 0, "wide": [14, 25, 36, 44], "wiki": 0, "wiki_onli": 51, "wikicorpus_en": 51, "wikipedia": [31, 32, 51], "wish": 39, "within": [0, 15, 25, 30, 37, 51], "without": [0, 4, 16, 18, 20, 21, 23, 28, 30, 31, 39, 40, 44, 52, 56, 63], "withsum": 24, "wl": 40, "wno": 34, "won": [5, 29, 36], "work": [1, 4, 7, 14, 15, 19, 20, 21, 27, 28, 29, 32, 35, 36, 40, 42, 45, 49, 52], "worker": 28, "workflow": 16, "workload": [2, 4, 16, 32, 35, 44, 52, 60, 63], "workspac": [2, 3, 34], "world": 28, "wors": 47, "would": [28, 37, 39, 61], "wrap": 28, "wrap_funct": 35, "wrapper": [28, 42], "write": [5, 7, 16, 19], "written": [0, 7, 27], "wrong": [39, 40], "ws1": 47, "wu": 25, "www": [0, 21, 42], "x": [11, 19, 25, 26, 28, 31, 39, 40, 47, 53, 58], "x15": 14, "x710": 31, "x86_64": [38, 39, 40], "x_test": [19, 28, 35], "x_train": [19, 28, 35], "xe": 31, "xeon": [4, 21, 31, 32, 35, 39, 40, 41, 44, 47], "xfd": 11, "xla": [4, 16, 27], "xla_global_id": 2, "xpu": [2, 4, 11, 14, 17, 19, 22, 25, 26, 28, 30, 33, 37, 38, 43, 45, 46, 47, 48, 49, 53, 54, 55, 58, 60], "xpu_force_sync": 33, "xpu_lib_path": 40, "xpuautoshard": [4, 33, 44], "xx": [34, 61], "xxx": [7, 52, 56], "xxxx": [58, 61], "xxxxx": [34, 51, 62], "xxxxxx": 11, "xxxxxxxx": 52, "xzf": 7, "xzvf": 32, "y": [11, 25, 26, 28, 35, 37, 39, 40, 47, 58, 63], "y_test": [19, 28, 35], "y_train": [19, 28, 35], "yaml": 61, "ye": [19, 38], "you": [2, 3, 4, 5, 7, 8, 11, 13, 14, 16, 17, 18, 20, 21, 22, 23, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60, 61, 62], "your": [2, 3, 5, 7, 14, 27, 30, 32, 34, 35, 37, 38, 39, 40, 41, 42, 46, 47, 49, 51, 52, 54, 56, 62, 63], "your_script": 29, "your_script_arg": 29, "yourself": 29, "yuxin": 25, "yyi": 52, "yym": 58, "yyyi": 58, "z": [40, 58], "ze_api": 14, "ze_enable_tracing_lay": [4, 21, 22, 28], "zero": [14, 25, 26, 28, 37], "zip": 28, "zoo": 44, "zxvf": 49, "zzz": 7, "zzzz": 58}, "titles": ["Contributor Covenant Code of Conduct", "Security Policy", "Intel\u00ae Extension for TensorFlow* Docker Container Guide", "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide", "Welcome to Intel\u00ae Extension for TensorFlow* documentation", "Online Documentation Build Guide", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!", "Contributing guidelines", "Releases", "Directory Tree Structure", "Extension Design", "How to write custom op", "Optimizations Design", "oneDNN object cache optimization", "Frequently Asked Questions", "INT8 Quantization", "OpenXLA", "XPUAutoShard on GPU [Experimental]", "Tune Advanced Auto Mixed Precision", "Advanced Auto Mixed Precision", "Environment Variables", "Features", "GPU Profiler", "Infrastructure", "Graph fusion", "Customized Operators", "Operators Override", "Keras 3 Overview", "Keras Mixed Precision", "Launch Script User Guide", "NextPluggableDevice Overview", "Performance Data", "Practice Guide", "Python APIs", "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*", "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]", "Online Weight Prepack", "<em>Experimental:</em> Intel\u00ae Arc\u2122 A-Series GPU Software Installation", "Conda Environment Installation Instructions", "Overview", "Intel\u00ae Extension for TensorFlow* for C++", "Intel CPU Software Installation", "Intel XPU Software Installation", "Installation Guide", "Examples", "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*", "Common Guide for Running", "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal", "ResNet50 Inference on Intel CPU and GPU", "Intel\u00ae Extension for Tensorflow* Model Quantization API Example", "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU", "Accelerate BERT-Large Pretraining on Intel GPU", "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae", "Quick Example on Intel CPU and GPU", "Stable Diffusion Inference for Text2Image on Intel GPU", "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU", "BERT Training for Classifying Text on Intel CPU and GPU", "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU", "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU", "Refer to train_resnet50", "Accelerate Mask R-CNN Training on Intel GPU", "Resnet50 train on Intel GPU", "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU", "Intel\u00ae Extension for TensorFlow*", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!"], "titleterms": {"1": [0, 11, 31, 34, 37, 40], "1550": 31, "17": 39, "170": 31, "1x": 31, "2": [0, 11, 34, 37, 40], "3": [0, 11, 27, 37], "3d": [31, 55], "4": [0, 11, 31, 37], "4x": 31, "5": 31, "6": 11, "7": 11, "8": 11, "9": 11, "A": 37, "By": 37, "For": [39, 40], "If": 61, "That": 2, "With": 62, "acceler": [45, 50, 51, 55, 60, 62], "access": [2, 32], "accuraci": [31, 54, 57], "activ": 26, "adamw": 26, "adamwithweightdecayoptim": 25, "add": 11, "addit": [31, 39], "advanc": [18, 19, 21, 23, 29, 47, 52], "ai": 31, "alexnet": 45, "all": 29, "alloc": [29, 32], "amp": [19, 21, 47], "api": [17, 18, 20, 21, 23, 33, 47, 48, 49, 54, 62], "appli": [49, 58, 61], "arc": 37, "architectur": [23, 30], "ask": 14, "attribut": [0, 18], "auto": [18, 19, 20, 21], "automat": 47, "automixedprecisionopt": 33, "b0": 31, "b3": 31, "backend": 20, "background": [18, 45, 52], "ban": 0, "bare": [41, 42, 47, 50], "base": [39, 40, 42, 45, 46], "basic": [24, 29], "bazel": [7, 39, 40], "bert": [31, 51, 56, 57], "bf16": 57, "binari": [2, 3, 63], "boost": 52, "build": [2, 3, 5, 11, 14, 28, 34, 39, 40, 41, 42], "c": [7, 34, 40], "cach": 13, "case": 27, "cc": 40, "center": 31, "chang": [8, 51, 54, 55, 57, 60, 61], "channel": 63, "check": [30, 42, 52, 58], "clang": 39, "classifi": [56, 57], "clone": [47, 58], "cnn": 60, "code": [0, 7, 17, 19, 39, 40, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "command": [51, 58, 61, 62], "common": [29, 39, 40, 46], "compar": 47, "compat": 63, "compil": 39, "compressor": 49, "conda": [38, 39, 40], "conduct": 0, "config": [20, 33], "configproto": 33, "configur": [18, 20, 31, 32, 39, 40, 47, 52], "constant": 52, "contain": [2, 3, 41, 42, 47, 50], "content": 32, "contribut": [7, 63], "contributor": 0, "control": 29, "converg": 51, "convolut": 13, "core": 29, "correct": 0, "count": 58, "coven": 0, "cpu": [21, 32, 35, 39, 40, 41, 42, 47, 48, 52, 53, 54, 56, 61, 63], "creat": [5, 39, 40, 58], "current": 30, "custom": [2, 11, 19, 23, 25, 28], "data": [19, 24, 31], "dataset": [49, 51, 55, 60, 61], "debug": 7, "debugopt": 33, "deep": [50, 52], "default": 29, "defin": 11, "definit": 20, "dens": 26, "depend": 58, "deprec": 42, "descript": [2, 3], "design": [10, 12, 29], "detail": 24, "devcloud": [45, 52], "develop": 7, "devic": [30, 58], "differ": [18, 27, 28], "diffus": [31, 54], "directli": 37, "directori": 9, "disabl": 52, "distribut": 58, "docker": [2, 3, 34, 41, 42, 47, 50], "dockerfil": [34, 41, 42], "dockerhub": [41, 42], "document": [4, 5, 6, 7, 63, 64], "download": [39, 40, 47, 56, 58], "driver": [37, 39, 40, 42, 46], "dtype": 28, "dump": 17, "eas": 21, "effect": 36, "efficientnet": 31, "eigen": 35, "enabl": [19, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "end": 18, "enforc": 0, "engin": 23, "environ": [18, 20, 29, 33, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "error": 27, "exampl": [16, 17, 18, 19, 22, 29, 35, 39, 40, 44, 48, 49, 51, 53, 54, 55, 57, 58, 60, 61, 62], "execut": [29, 45, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "experiment": [17, 21, 35, 37], "extens": [2, 3, 4, 6, 7, 10, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "extra": [39, 40], "extract": 40, "faq": [22, 47, 48, 51, 54, 55, 56, 57, 60], "featur": [19, 21, 23], "file": 40, "fine": 57, "finetun": 51, "fit": 28, "flex": 31, "fold": 52, "format": 32, "fp16": 54, "fp32": [47, 54], "fp8": 57, "frequent": 14, "from": [2, 14, 34, 40, 41, 42], "full": 37, "function": 52, "further": 62, "fusion": 24, "gelu": [25, 26], "gener": 24, "get": [41, 42], "get_config": 33, "gnu": 32, "gpu": [2, 17, 21, 22, 31, 32, 37, 39, 40, 42, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62], "gpuoption": 33, "graph": [17, 19, 21, 24, 33, 52], "graphopt": 33, "groupnorm": 25, "guid": [2, 3, 5, 7, 29, 32, 43, 46, 50], "guidelin": [0, 7], "hardwar": [28, 31, 32, 37, 39, 40, 41, 42, 45, 47, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "header": 40, "highlight": 4, "horovod": [55, 58, 61], "how": [11, 16, 28], "hvd": 61, "i": [2, 3, 29], "identifi": 28, "ii": [2, 3, 29], "iii": [2, 29], "imag": [3, 31, 34, 55], "imagenet": 61, "implement": [11, 24], "import": 33, "improv": 18, "incept": [47, 52], "includ": 29, "incompat": 8, "index": 29, "infer": [29, 31, 47, 48, 50, 54], "infrastructur": 23, "instal": [11, 34, 37, 38, 39, 40, 41, 42, 43, 49, 53, 58, 62, 63], "instanc": [26, 29], "instruct": [37, 38], "int8": [15, 21], "integr": 40, "intel": [2, 3, 4, 6, 7, 23, 31, 32, 33, 34, 35, 37, 39, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64], "intel_extension_for_tensorflow": 33, "interfac": 11, "introduct": [5, 13, 23, 45, 47, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "issu": 8, "itex": [25, 33], "itex_verbos": 20, "itexlstm": 25, "iv": 29, "ix": 29, "jemalloc": 29, "jupyt": [52, 54, 56], "kera": [27, 28], "kernel": 11, "known": 8, "lamboptim": 25, "larg": [31, 51, 57], "latenc": 29, "latest": 5, "launch": 29, "launcher": 21, "layer": 26, "layernorm": 25, "layout": [24, 32], "lead": 27, "learn": [50, 52], "level": 20, "librari": [34, 40], "licens": [52, 63], "limit": 36, "linker": 40, "linux": 37, "list": 18, "load": 40, "local": [5, 45, 52], "log": [19, 29], "logic": 29, "loop": 28, "loss": 28, "lstm": 26, "manag": 23, "manual": 19, "mask": [31, 60], "matrix": 52, "max": 31, "medic": [31, 55], "memori": [29, 32], "metal": [41, 42, 47, 50], "method": 47, "mix": [18, 19, 20, 21, 24, 28, 47], "mobilenet": 18, "mode": 29, "model": [28, 31, 34, 47, 49, 50, 51, 54, 55, 57, 60, 61], "multi": [29, 55], "multipl": 29, "name": 33, "nativ": 37, "net": 31, "neural": 49, "nextpluggabledevic": 30, "node": [29, 31], "non": 32, "normal": 26, "note": 53, "notebook": [52, 54, 56], "notic": 19, "numa": [29, 32], "numactl": 32, "number": 29, "numer": 18, "o": 55, "object": [13, 16], "omp_num_thread": 32, "one": 29, "oneapi": [37, 39, 40, 42, 46, 58], "onednn": [13, 52], "onli": [39, 40, 42], "onlin": [5, 36], "op": [11, 25, 33], "openmp": [32, 35], "openxla": [16, 21, 30], "oper": [19, 21, 25, 26, 33], "optim": [12, 13, 19, 21, 24, 58], "option": [20, 37, 39, 40, 58], "origin": 19, "other": 62, "our": 0, "output": [48, 53, 54, 58, 61, 62], "overflow": 28, "overrid": [26, 33], "overview": [15, 16, 17, 19, 20, 27, 28, 29, 30, 31, 32, 33, 36, 39, 49], "packag": [11, 40, 42, 62], "paramet": [61, 62], "patch": [58, 61], "perform": [18, 27, 31, 47], "perman": 0, "phase2": 31, "physic": 29, "pjrt": 30, "platform": 42, "pledg": 0, "pluggabledevic": 30, "plugin": 30, "polici": [1, 28], "pool": 35, "practic": 32, "pre": 49, "precis": [18, 19, 20, 21, 28, 47], "precondit": 38, "prepack": 36, "prepar": [2, 3, 40, 44, 46, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "prerequisit": [11, 33, 48, 51, 54, 55, 56, 57, 60, 61, 62], "preserv": 33, "pretrain": [47, 51], "product": 31, "profil": [21, 22], "protocol": [20, 33], "public": 23, "py": 53, "pypi": [37, 39, 41, 42], "python": [7, 11, 17, 18, 20, 21, 33, 40, 47, 48, 54, 62], "pythonpath": 62, "quantiz": [15, 21, 45, 49, 52], "question": 14, "quick": [19, 50, 53], "quick_exampl": 53, "r": 60, "rcnn": 31, "recommend": 40, "refer": [16, 36, 59], "regist": 11, "releas": [5, 8, 37], "repo": 58, "report": 1, "repositori": 47, "requir": [37, 39, 40, 41, 42, 47, 51, 54, 55, 56, 57, 60, 61, 62, 63], "resnet50": [48, 61, 62], "resnet50v1": 31, "resourc": [10, 63], "respons": 0, "result": [31, 47, 51], "rule": 18, "run": [2, 3, 34, 37, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "runtim": [14, 30], "sampl": 34, "save": 19, "scale": 28, "scope": 0, "script": [2, 29, 46], "secur": [1, 63], "segment": 55, "select": 35, "seri": 37, "serv": [3, 21, 34], "server": [34, 45, 52], "set": [28, 29, 45, 49, 61, 62], "set_config": 33, "setup": [19, 28, 37, 42, 46, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "shard": 62, "shardingconfig": 33, "singl": [29, 55], "situat": 27, "skip": [47, 48, 54, 56, 61], "softwar": [31, 32, 37, 41, 42, 49, 63], "sourc": [14, 34, 39, 40], "speed": 47, "stabil": 18, "stabl": [31, 54], "standard": 0, "start": [30, 50], "startup": [52, 56], "step": [37, 38, 47, 48, 54, 56, 61], "stock": [18, 19], "structur": [9, 17], "style": 7, "subsystem": 37, "support": [21, 63], "switch": 30, "system": [37, 41, 42], "tabl": [32, 63], "tcmalloc": [29, 32], "temporari": 0, "tensorflow": [2, 3, 4, 6, 7, 18, 19, 21, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "test": [5, 7, 47], "text": [56, 57], "text2imag": 54, "tf_num_interop_thread": 29, "tf_num_intraop_thread": 29, "thi": [47, 48, 54, 56, 61], "thread": 35, "throughput": 29, "tile": 55, "tip": [7, 19], "toolkit": [39, 40, 42, 46], "train": [19, 28, 31, 49, 50, 55, 56, 58, 60, 61, 62], "train_resnet50": 59, "tree": 9, "troubleshoot": 14, "tune": [18, 19, 57], "type": [19, 24, 28, 30], "u": 31, "ubuntu": 37, "underflow": 28, "unet": 55, "uniform": 32, "unit": 7, "up": [45, 47, 49], "updat": 5, "us": [11, 21, 27, 29, 30, 34, 35, 61], "usag": [2, 15, 17, 18, 19, 22, 26, 29, 36], "user": 29, "v": [19, 29], "v1": 31, "v3": 52, "v4": 47, "variabl": [18, 20, 29, 33, 37, 42, 47], "vasriabl": 54, "verifi": [2, 11, 37, 41, 42], "version": [5, 33, 52], "vi": 29, "via": [20, 37, 41, 42, 47], "vii": 29, "viii": 29, "virtual": [37, 41, 42, 46, 58], "vulner": 1, "w": 55, "warn": [0, 27], "weekli": 63, "weight": 36, "welcom": [4, 6, 64], "wheel": [37, 41, 42], "why": 30, "window": 37, "without": [61, 62], "work": 16, "workflow": [10, 15, 17, 36], "workload": [31, 50], "write": 11, "wsl2": 37, "x": 29, "xeon": 52, "xla": 30, "xpu": [23, 39, 40, 42, 63], "xpuautoshard": [17, 21, 62], "your": 29, "zoo": 50}})
\ No newline at end of file