diff --git a/_sources/features/custom_scripts.md.txt b/_sources/features/custom_scripts.md.txt
index f4a8b6669..14ab4ba22 100644
--- a/_sources/features/custom_scripts.md.txt
+++ b/_sources/features/custom_scripts.md.txt
@@ -51,8 +51,8 @@ Use `my_script.py` with Olive workflow configuration json file(sub_types name sh
         "type": "accuracy",
         "sub_types": [
             {"name": "accuracy_score", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}},
-            {"name": "f1_score", "metric_config": {"multiclass": false}},
-            {"name": "auroc", "metric_config": {"num_classes": 2}}
+            {"name": "f1_score"},
+            {"name": "auroc"}
         ],
         "user_config":{
             "post_processing_func": "post_process",
@@ -103,8 +103,8 @@ Use `script_dir` and `my_script.py` with Olive workflow configuration json file:
         "type": "accuracy",
         "sub_types": [
             {"name": "accuracy_score", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}},
-            {"name": "f1_score", "metric_config": {"multiclass": false}},
-            {"name": "auroc", "metric_config": {"num_classes": 2}}
+            {"name": "f1_score"},
+            {"name": "auroc"}
         ],
         "user_config":{
             "post_processing_func": "post_process",
diff --git a/_sources/overview/options.md.txt b/_sources/overview/options.md.txt
index ae6b31e50..9870fa72e 100644
--- a/_sources/overview/options.md.txt
+++ b/_sources/overview/options.md.txt
@@ -233,7 +233,7 @@ information of the evaluator contains following items:
   - `type: [str]` The type of the metric. The supported types are `accuracy`, `latency`, `throughput` and `custom`.
   - `backend: [str]` The type of metrics' backend. Olive implement `torch_metrics` and `huggingface_metrics` backends. The default value is `torch_metrics`.
-    - `torch_metrics` backend uses `torchmetrics` library to compute metrics. It supports `accuracy_score`, `f1_score`, `precision`, `recall` and `auc` metrics.
+    - `torch_metrics` backend uses `torchmetrics` (>=0.1.0) library to compute metrics. It supports `accuracy_score`, `f1_score`, `precision`, `recall` and `auroc` metrics, which are used for the `binary` task (equal to `metric_config: {"task": "binary"}`) by default. You need to alter the `task` if needed. Please refer to [torchmetrics](https://lightning.ai/docs/torchmetrics/stable/) for more details.
     - `huggingface_metrics` backend uses huggingface `evaluate` library to compute metrics. The supported metrics can be found at [huggingface metrics](https://huggingface.co/metrics).
   - `subtypes: [List[Dict]]` The subtypes of the metric. Cannot be null or empty.
 Each subtype is a dictionary that contains following items:
@@ -311,8 +311,8 @@ information of the evaluator contains following items:
             "type": "accuracy",
             "sub_types": [
                 {"name": "accuracy_score", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}},
-                {"name": "f1_score", "metric_config": {"multiclass": false}},
-                {"name": "auroc", "metric_config": {"num_classes": 2}}
+                {"name": "f1_score"},
+                {"name": "auroc"}
             ],
             "user_config":{
                 "post_processing_func": "post_process",
diff --git a/_sources/tutorials/configure_metrics.rst.txt b/_sources/tutorials/configure_metrics.rst.txt
index ff45262e1..882272cc7 100644
--- a/_sources/tutorials/configure_metrics.rst.txt
+++ b/_sources/tutorials/configure_metrics.rst.txt
@@ -19,8 +19,8 @@ Accuracy Metric
         "type": "accuracy",
         "sub_types": [
             {"name": "accuracy_score", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}},
-            {"name": "f1_score", "metric_config": {"multiclass": false}},
-            {"name": "auroc", "metric_config": {"num_classes": 2}}
+            {"name": "f1_score"},
+            {"name": "auroc"}
         ],
         "user_config": {
             "post_processing_func": "post_process",
@@ -227,8 +227,8 @@ If you have multiple metrics to evaluate, you can configure them in the followin
             "type": "accuracy",
             "sub_types": [
                 {"name": "accuracy_score", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}},
-                {"name": "f1_score", "metric_config": {"multiclass": false}},
-                {"name": "auroc", "metric_config": {"num_classes": 2}}
+                {"name": "f1_score"},
+                {"name": "auroc"}
             ]
         },
         {
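With the `options.md.txt` change above, the `torch_metrics` backend defaults every sub-type to the `binary` task, which is why the explicit `metric_config` entries are dropped from these examples. For a non-binary model the default would still need to be overridden; below is a minimal sketch of such a sub-type entry, assuming `metric_config` forwards `torchmetrics` keyword arguments (the `multiclass`/`num_classes` values are illustrative, not taken from this diff):

```json
{"name": "f1_score", "metric_config": {"task": "multiclass", "num_classes": 3}}
```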
diff --git a/features/custom_scripts.html b/features/custom_scripts.html
index 86510ad66..7a7a24374 100644
--- a/features/custom_scripts.html
+++ b/features/custom_scripts.html
@@ -184,8 +184,8 @@
 [hunk shown as rendered text]
 type: [str]
 The type of the metric. The supported types are accuracy, latency, throughput and custom.
 backend: [str]
 The type of metrics’ backend. Olive implement torch_metrics and huggingface_metrics backends. The default value is torch_metrics.
-torch_metrics backend uses torchmetrics library to compute metrics. It supports accuracy_score, f1_score, precision, recall and auc metrics.
+torch_metrics backend uses torchmetrics (>=0.1.0) library to compute metrics. It supports accuracy_score, f1_score, precision, recall and auroc metrics, which are used for the binary task (equal to metric_config: {"task": "binary"}) by default. You need to alter the task if needed. Please refer to torchmetrics for more details.
 huggingface_metrics backend uses huggingface evaluate library to compute metrics. The supported metrics can be found at huggingface metrics.
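For context on what the new `binary` default means in `torchmetrics` itself, here is a minimal sketch, assuming a `torchmetrics` release with the task-based API and made-up sample tensors:

```python
import torch
from torchmetrics.functional import auroc, f1_score

# Illustrative predicted probabilities and ground-truth labels.
preds = torch.tensor([0.9, 0.1, 0.8, 0.3])
target = torch.tensor([1, 0, 1, 0])

# The equivalent of Olive's default metric_config {"task": "binary"}:
print(f1_score(preds, target, task="binary"))  # probabilities thresholded at 0.5 -> tensor(1.)
print(auroc(preds, target, task="binary"))     # tensor(1.)
```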