
Commit 8f521ba

Move Qnn-Gpu recipes to QNN directory
1 parent e6bd75d commit 8f521ba

34 files changed: +294 −552 lines changed
Lines changed: 25 additions & 0 deletions
@@ -0,0 +1,25 @@
+# Bert-base-multilingual-cased Model Optimization
+
+### QNN-GPU
+
+Running QNN-GPU configs requires features and fixes that are not available in the released Olive version 0.9.3.
+To ensure compatibility, install Olive directly from source at the required commit:
+
+```bash
+pip install git+https://github.com/microsoft/Olive.git@da24463e14ed976503dc5871572b285bc5ddc4b2
+```
+
+If you previously installed Olive from PyPI or pinned it to version 0.9.3, uninstall it first, then install from
+the commit above:
+
+```bash
+pip uninstall olive-ai
+```
+
+To run the config:
+
+```bash
+olive run --config config_qnn_gpu.json
+```
+
+✅ Optimized model saved in: `output/`
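
To double-check which Olive build ended up in the environment after the source install, a quick version query is enough. This is a minimal sketch using only the standard library and the `olive-ai` package name from the commands above; the exact version string a source build reports may vary.

```python
# Minimal check: report the installed olive-ai build (a source install from the
# pinned commit typically reports a dev/pre-release version rather than 0.9.3).
from importlib.metadata import PackageNotFoundError, version

try:
    print("olive-ai version:", version("olive-ai"))
except PackageNotFoundError:
    print("olive-ai is not installed in this environment")
```
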
Lines changed: 17 additions & 41 deletions
@@ -46,50 +46,26 @@
             ]
         }
     },
-    "data_configs": [
-        {
-            "name": "quantization_data_config",
-            "type": "HuggingfaceContainer",
-            "load_dataset_config": {
-                "data_name": "facebook/xnli",
-                "subset": "en",
-                "split": "validation"
-            },
-            "pre_process_data_config": {
-                "input_cols": [
-                    "premise"
-                ],
-                "padding": "max_length",
-                "max_length": 128,
-                "max_samples": 10
-            },
-            "dataloader_config": {
-                "batch_size": 1
-            }
+    "passes": {
+        "conversion": {
+            "type": "OnnxConversion",
+            "target_opset": 20,
+            "save_as_external_data": false
         },
-        {
-            "name": "evaluation_data_config",
-            "type": "HuggingfaceContainer",
-            "load_dataset_config": {
-                "data_name": "facebook/xnli",
-                "subset": "en",
-                "split": "validation"
-            },
-            "pre_process_data_config": {
-                "input_cols": [
-                    "premise"
-                ],
-                "padding": "max_length",
-                "max_length": 128,
-                "max_samples": 10
-            },
-            "dataloader_config": {
-                "batch_size": 1
-            }
+        "surgery": {
+            "type": "GraphSurgeries",
+            "surgeries": [
+                {
+                    "surgeon": "ReplaceAttentionMaskValue"
+                },
+                {
+                    "surgeon": "MatMulAddToGemm"
+                }
+            ]
         }
-    ],
+    },
     "target": "target_system",
     "cache_dir": "cache",
-    "output_dir": "model/google_bert",
+    "output_dir": "output",
     "evaluate_input_model": false
 }
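
With the quantization and evaluation `data_configs` gone, the remaining workflow is a plain conversion plus graph-surgery pipeline, so it can also be launched from Python rather than the CLI. A minimal sketch, assuming the programmatic entry point `olive.workflows.run` accepts the same JSON config as `olive run`:

```python
# Sketch: run the QNN-GPU workflow programmatically instead of via the CLI.
from olive.workflows import run as olive_run

# Equivalent to: olive run --config config_qnn_gpu.json
olive_run("config_qnn_gpu.json")
```
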
Lines changed: 7 additions & 0 deletions
@@ -0,0 +1,7 @@
+keywords:
+  QNN
+arch: bert
+recipes:
+  - file: "config_qnn_gpu.json"
+    device: gpu
+    ep: QNNExecutionProvider

google-bert-bert-base-multilingual-cased/aitk/bert-base-multilingual-cased_qnn_gpu.json.config

Lines changed: 0 additions & 38 deletions
This file was deleted.

google-bert-bert-base-multilingual-cased/aitk/info.yml

Lines changed: 0 additions & 3 deletions
@@ -23,9 +23,6 @@ recipes:
   - file: "bert-base-multilingual-cased_migraphx.json"
     device: gpu
     ep: MIGraphXExecutionProvider
-  - file: "bert-base-multilingual-cased_qnn_gpu.json"
-    device: gpu
-    ep: QNNExecutionProvider
 aitk:
   modelInfo:
     id: "huggingface/google-bert/bert-base-multilingual-cased"

google-vit-base-patch16-224/QNN/README.md

Lines changed: 24 additions & 0 deletions
@@ -16,3 +16,27 @@ You can test output model with provided scripts. It is also a example you can re
 ```
 python .\val_tiny_imagenet.py
 ```
+
+### QNN-GPU
+
+Running QNN-GPU configs requires features and fixes that are not available in the released Olive version 0.9.3.
+To ensure compatibility, install Olive directly from source at the required commit:
+
+```bash
+pip install git+https://github.com/microsoft/Olive.git@da24463e14ed976503dc5871572b285bc5ddc4b2
+```
+
+If you previously installed Olive from PyPI or pinned it to version 0.9.3, uninstall it first, then install from
+the commit above:
+
+```bash
+pip uninstall olive-ai
+```
+
+To run the config:
+
+```bash
+olive run --config vit_qnn_gpu.json
+```
+
+✅ Optimized model saved in: `output/`
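
The README already points at `val_tiny_imagenet.py` for validation; a lighter smoke test is to load the optimized model directly with ONNX Runtime's QNN execution provider. This is a sketch, assuming a QNN-enabled onnxruntime build, the QNN SDK's GPU backend library (`QnnGpu.dll` on Windows) on the library path, and a hypothetical `output/model.onnx` path; the actual filename under `output/` may differ.

```python
# Smoke-test sketch for the optimized ViT model on the QNN GPU backend.
import numpy as np
import onnxruntime as ort

session = ort.InferenceSession(
    "output/model.onnx",  # assumed output path; adjust to the real exported file
    providers=[("QNNExecutionProvider", {"backend_path": "QnnGpu.dll"})],
)

# Input/output names and shape follow the io_config in vit_qnn_gpu.json.
pixel_values = np.random.rand(1, 3, 224, 224).astype(np.float32)
(logits,) = session.run(["logits"], {"pixel_values": pixel_values})
print(logits.shape)
```
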

google-vit-base-patch16-224/QNN/info.yml

Lines changed: 3 additions & 0 deletions
@@ -5,3 +5,6 @@ recipes:
   - file: "vit_qnn_fp32_ctx.json"
     device: npu
     ep: QNNExecutionProvider
+  - file: "vit_qnn_gpu.json"
+    device: gpu
+    ep: QNNExecutionProvider
Lines changed: 55 additions & 0 deletions
@@ -0,0 +1,55 @@
+{
+    "input_model": {
+        "type": "HfModel",
+        "model_path": "google/vit-base-patch16-224",
+        "task": "image-classification",
+        "io_config": {
+            "input_names": [
+                "pixel_values"
+            ],
+            "input_shapes": [
+                [
+                    1,
+                    3,
+                    224,
+                    224
+                ]
+            ],
+            "output_names": [
+                "logits"
+            ]
+        }
+    },
+    "systems": {
+        "target_system": {
+            "type": "LocalSystem",
+            "accelerators": [
+                {
+                    "device": "gpu",
+                    "execution_providers": [
+                        "QNNExecutionProvider"
+                    ]
+                }
+            ]
+        }
+    },
+    "passes": {
+        "conversion": {
+            "type": "OnnxConversion",
+            "target_opset": 20,
+            "save_as_external_data": false
+        },
+        "surgery": {
+            "type": "GraphSurgeries",
+            "surgeries": [
+                {
+                    "surgeon": "MatMulAddToGemm"
+                }
+            ]
+        }
+    },
+    "target": "target_system",
+    "output_dir": "output",
+    "evaluate_input_model": false,
+    "cache_dir": "cache"
+}
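
The `MatMulAddToGemm` surgeon listed in the `GraphSurgeries` pass rewrites, as its name suggests, a `MatMul` followed by an `Add` into a single `Gemm` node. The numeric equivalence it relies on is just ONNX's Gemm definition (`alpha * A @ B + beta * C` with default `alpha = beta = 1`); the sketch below illustrates it with made-up shapes and names, not code taken from Olive.

```python
# Illustration of the MatMul + Add -> Gemm rewrite: both compute X @ W + B.
import numpy as np

rng = np.random.default_rng(0)
X = rng.standard_normal((1, 768)).astype(np.float32)    # activations
W = rng.standard_normal((768, 768)).astype(np.float32)  # weights
B = rng.standard_normal((768,)).astype(np.float32)      # bias

matmul_then_add = X @ W + B       # original MatMul -> Add pattern
gemm = 1.0 * (X @ W) + 1.0 * B    # Gemm with default alpha/beta
assert np.allclose(matmul_then_add, gemm)
```

Collapsing the pair into one Gemm node hands the execution provider a single fused operator to map, which is presumably why both QNN-GPU configs apply this surgery.
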

google-vit-base-patch16-224/aitk/info.yml

Lines changed: 0 additions & 3 deletions
@@ -23,9 +23,6 @@ recipes:
   - file: "vit-base-patch16-224_migraphx.json"
     device: gpu
     ep: MIGraphXExecutionProvider
-  - file: "vit-base-patch16-224_qnn_gpu.json"
-    device: gpu
-    ep: QNNExecutionProvider
 aitk:
   modelInfo:
     id: "huggingface/google/vit-base-patch16-224"

google-vit-base-patch16-224/aitk/vit-base-patch16-224_qnn_gpu.json

Lines changed: 0 additions & 95 deletions
This file was deleted.
