intel
diff --git a/‎neural_coder/__init__.py‎
Lines changed: 3 additions & 1 deletion b/‎neural_coder/__init__.py‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎neural_coder/coders/pytorch/neural_compressor/__init__.py‎ renamed to ‎neural_coder/backends/__init__.py‎
Lines changed: 0 additions & 2 deletions b/‎neural_coder/coders/pytorch/neural_compressor/__init__.py‎ renamed to ‎neural_coder/backends/__init__.py‎
Lines changed: 0 additions & 2 deletions
diff --git a/‎neural_coder/backends/pytorch_aliblade.yaml‎
Lines changed: 25 additions & 0 deletions b/‎neural_coder/backends/pytorch_aliblade.yaml‎
Lines changed: 25 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_benchmark.yaml‎
Lines changed: 59 additions & 0 deletions b/‎neural_coder/backends/pytorch_benchmark.yaml‎
Lines changed: 59 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_channels_last.yaml‎
Lines changed: 37 additions & 0 deletions b/‎neural_coder/backends/pytorch_channels_last.yaml‎
Lines changed: 37 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_inc_bf16.yaml‎
Lines changed: 32 additions & 0 deletions b/‎neural_coder/backends/pytorch_inc_bf16.yaml‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_inc_dynamic_quant.yaml‎
Lines changed: 38 additions & 0 deletions b/‎neural_coder/backends/pytorch_inc_dynamic_quant.yaml‎
Lines changed: 38 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_inc_static_quant_fx.yaml‎
Lines changed: 41 additions & 0 deletions b/‎neural_coder/backends/pytorch_inc_static_quant_fx.yaml‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_inc_static_quant_ipex.yaml‎
Lines changed: 41 additions & 0 deletions b/‎neural_coder/backends/pytorch_inc_static_quant_ipex.yaml‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎neural_coder/backends/pytorch_ipex_bf16.yaml‎
Lines changed: 42 additions & 0 deletions b/‎neural_coder/backends/pytorch_ipex_bf16.yaml‎
Lines changed: 42 additions & 0 deletions
@@ -14,4 +14,6 @@
 
 from .interface import enable
 from .interface import bench
-from .interface import superbench
+from .interface import superbench
+# from .interface import superreport
+from .interface import auto_quant
@@ -11,5 +11,3 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
-
@@ -0,0 +1,25 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe; the location/content/order lists each hold one entry here and appear to pair up by position.
+  location:  # Insertion-point keywords; the nested list presumably ties one snippet to both the model and input lines -- TODO confirm.
+    - ["insert_below_model_definition_line", "insert_below_input_definition_line"]
+  content:  # "[+]" marks a line to add; MODEL_NAME / INPUT_NAME look like placeholders. NOTE(review): torch is used but not imported here.
+    - |-
+      [+] import torch_blade
+      [+] with torch.no_grad():
+      [+]     MODEL_NAME = torch_blade.optimize(MODEL_NAME, allow_tracing=True, model_inputs=tuple(INPUT_NAME))
+  order:  # Placement relative to other backends' snippets; both lists are empty, so none is declared.
+    - below:
+      above:
@@ -0,0 +1,59 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Benchmark recipe: wraps the inference line in a timed loop; location/content/order entries pair up by position.
+  location:  # One insertion-point keyword per content entry below (presumably resolved by the Neural Coder engine -- verify).
+    - insert_above_inference_line  # receives the first snippet (loop header and timer start)
+    - insert_below_inference_line  # receives the second snippet (timer stop and report)
+    - indent_inference_line  # paired with the bare integer at the end of content
+  content:  # "[+]" marks a line to add. The first 3 iterations are untimed warm-up; num_iter_ is clamped so at least one run is timed.
+    - |-
+      [+] if not ACCURACY_MODE:
+      [+]     import time
+      [+]     count_iter_ = 0
+      [+]     total_time_ = 0
+      [+]     num_warmup_iter_ = 3
+      [+]     num_iter_ = max(NUM_BENCHMARK_ITERATION, num_warmup_iter_ + 1)
+      [+]     list_batch_time_ = []
+      [+]     for i_ in range(num_iter_):
+      [+]         count_iter_ = count_iter_ + 1
+      [+]         if count_iter_ > num_warmup_iter_:
+      [+]             t1_ = time.perf_counter()
+      [+]         with torch.no_grad():
+    - |-
+      [+]         if count_iter_ > num_warmup_iter_:
+      [+]             t2_ = time.perf_counter()
+      [+]             batch_time_ = t2_ - t1_
+      [+]             list_batch_time_.append(batch_time_)
+      [+]             total_time_ = total_time_ + batch_time_
+      [+]     print("Neural_Coder_Bench_IPS: ", round((num_iter_ - num_warmup_iter_) / total_time_, 3))
+      [+]     print("Neural_Coder_Bench_MSPI: ", round(total_time_ / (num_iter_ - num_warmup_iter_) * 1000, 3))
+      [+]     list_batch_time_.sort()
+      [+]     p50_latency_ = list_batch_time_[int(len(list_batch_time_) * 0.50) - 1] * 1000
+      [+]     p90_latency_ = list_batch_time_[int(len(list_batch_time_) * 0.90) - 1] * 1000
+      [+]     p99_latency_ = list_batch_time_[int(len(list_batch_time_) * 0.99) - 1] * 1000
+      [+]     print("Neural_Coder_Bench_P50: ", round(p50_latency_, 3))
+      [+]     print("Neural_Coder_Bench_P90: ", round(p90_latency_, 3))
+      [+]     print("Neural_Coder_Bench_P99: ", round(p99_latency_, 3))
+      [+]     quit()
+      [+] else:
+      [+]     INFERENCE_LINE
+    - 3  # presumably indent levels for the inference line: it ends up under if / for / with -- TODO confirm
+  order:  # Placement relative to other backends' snippets; every below/above list is empty, so none is declared.
+    - below:
+      above:
+    - below:
+      above:
+    - below:
+      above:
@@ -0,0 +1,37 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe: converts the model to channels_last memory format; lists appear to pair up by position.
+  location:  # Insertion-point keyword for the snippet (presumably resolved by the Neural Coder engine -- verify).
+    - insert_below_model_definition_line
+  content:  # "[+]" marks a line to add; MODEL_NAME looks like a placeholder for the user's model variable -- TODO confirm.
+    - |-
+      [+] import torch
+      [+] with torch.no_grad():
+      [+]     MODEL_NAME.eval()
+      [+]     MODEL_NAME = MODEL_NAME.to(memory_format=torch.channels_last)
+  order:  # Presumably: this snippet goes below the backends under "below" and above those under "above" -- verify.
+    - below:  # NOTE(review): pytorch_inc_bf16 lists this backend under its own "above" but is absent here -- confirm intent.
+        - pytorch_inc_static_quant_fx
+        - pytorch_inc_static_quant_ipex
+        - pytorch_inc_dynamic_quant
+      above:
+        - pytorch_ipex_fp32
+        - pytorch_ipex_bf16
+        - pytorch_ipex_int8_static_quant
+        - pytorch_ipex_int8_dynamic_quant
+        - pytorch_jit_script
+        - pytorch_jit_script_ofi
+        - pytorch_jit_trace
+        - pytorch_jit_trace_ofi
@@ -0,0 +1,32 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe: runs the model through neural_compressor MixedPrecision with 'bf16'; lists pair up by position.
+  location:  # Insertion-point keyword for the snippet (presumably resolved by the Neural Coder engine -- verify).
+    - insert_below_model_definition_line
+  content:  # "[+]" marks a line to add; MODEL_NAME looks like a placeholder and is rebound to the converter's result.
+    - |-
+      [+] from neural_compressor.experimental import MixedPrecision
+      [+] converter = MixedPrecision()
+      [+] converter.precisions = 'bf16'
+      [+] converter.model = MODEL_NAME
+      [+] MODEL_NAME = converter()
+  order:  # Presumably: this snippet goes above the backends listed under "above"; "below" is empty -- verify.
+    - below:
+      above:
+        - pytorch_jit_script
+        - pytorch_jit_script_ofi
+        - pytorch_jit_trace
+        - pytorch_jit_trace_ofi
+        - pytorch_channels_last
@@ -0,0 +1,38 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe: neural_compressor post-training dynamic quantization; lists appear to pair up by position.
+  location:  # Insertion-point keyword for the snippet (presumably resolved by the Neural Coder engine -- verify).
+    - insert_below_model_definition_line
+  content:  # "[+]" marks a line to add; the snippet is skipped when the model's type name already contains "GraphModule".
+    - |-
+      [+] if "GraphModule" not in str(type(MODEL_NAME)):
+      [+]     from neural_compressor.conf.config import QuantConf
+      [+]     from neural_compressor.experimental import Quantization, common
+      [+]     quant_config = QuantConf()
+      [+]     quant_config.usr_cfg.quantization.approach = "post_training_dynamic_quant"
+      [+]     quant_config.usr_cfg.model.framework = "pytorch"
+      [+]     quantizer = Quantization(quant_config)
+      [+]     quantizer.model = common.Model(MODEL_NAME)
+      [+]     MODEL_NAME = quantizer()
+      [+]     MODEL_NAME = MODEL_NAME.model
+      [+]     MODEL_NAME.eval()
+  order:  # Presumably: this snippet goes above the backends listed under "above"; "below" is empty -- verify.
+    - below:
+      above:
+        - pytorch_jit_script
+        - pytorch_jit_script_ofi
+        - pytorch_jit_trace
+        - pytorch_jit_trace_ofi
+        - pytorch_channels_last
@@ -0,0 +1,41 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe: neural_compressor quantization with framework "pytorch_fx"; lists appear to pair up by position.
+  location:  # Nested list presumably ties the one snippet to the dataloader, model and input definition lines -- TODO confirm.
+    - ["insert_below_dataloader_definition_line", "insert_below_model_definition_line", "insert_below_input_definition_line"]
+  content:  # "[+]" marks a line to add; MODEL_NAME, DATALOADER_NAME and EVAL_FUNC_LINES look like placeholders -- TODO confirm.
+    - |-
+      [+] if "GraphModule" not in str(type(MODEL_NAME)):
+      [+]     def eval_func(model):
+      [+]         EVAL_FUNC_LINES
+      [+]     from neural_compressor.conf.config import QuantConf
+      [+]     from neural_compressor.experimental import Quantization, common
+      [+]     quant_config = QuantConf()
+      [+]     quant_config.usr_cfg.model.framework = "pytorch_fx"
+      [+]     quantizer = Quantization(quant_config)
+      [+]     quantizer.model = common.Model(MODEL_NAME)
+      [+]     quantizer.calib_dataloader = DATALOADER_NAME
+      [+]     quantizer.eval_func = eval_func
+      [+]     MODEL_NAME = quantizer()
+      [+]     MODEL_NAME = MODEL_NAME.model
+      [+]     MODEL_NAME.eval()
+  order:  # Presumably: this snippet goes above the backends listed under "above"; "below" is empty -- verify.
+    - below:
+      above:
+        - pytorch_jit_script
+        - pytorch_jit_script_ofi
+        - pytorch_jit_trace
+        - pytorch_jit_trace_ofi
+        - pytorch_channels_last
@@ -0,0 +1,41 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe: neural_compressor quantization with framework "pytorch_ipex"; lists appear to pair up by position.
+  location:  # Nested list presumably ties the one snippet to the dataloader, model and input definition lines -- TODO confirm.
+    - ["insert_below_dataloader_definition_line", "insert_below_model_definition_line", "insert_below_input_definition_line"]
+  content:  # "[+]" marks a line to add; MODEL_NAME, DATALOADER_NAME and EVAL_FUNC_LINES look like placeholders -- TODO confirm.
+    - |-
+      [+] if "GraphModule" not in str(type(MODEL_NAME)):
+      [+]     def eval_func(model):
+      [+]         EVAL_FUNC_LINES
+      [+]     from neural_compressor.conf.config import QuantConf
+      [+]     from neural_compressor.experimental import Quantization, common
+      [+]     quant_config = QuantConf()
+      [+]     quant_config.usr_cfg.model.framework = "pytorch_ipex"
+      [+]     quantizer = Quantization(quant_config)
+      [+]     quantizer.model = common.Model(MODEL_NAME)
+      [+]     quantizer.calib_dataloader = DATALOADER_NAME
+      [+]     quantizer.eval_func = eval_func
+      [+]     MODEL_NAME = quantizer()
+      [+]     MODEL_NAME = MODEL_NAME.model
+      [+]     MODEL_NAME.eval()
+  order:  # Presumably: this snippet goes above the backends listed under "above"; "below" is empty -- verify.
+    - below:
+      above:
+        - pytorch_jit_script
+        - pytorch_jit_script_ofi
+        - pytorch_jit_trace
+        - pytorch_jit_trace_ofi
+        - pytorch_channels_last
@@ -0,0 +1,42 @@
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+transformation:  # Backend recipe: IPEX bf16 optimization plus a bf16 autocast around inference; lists pair up by position.
+  location:  # One insertion-point keyword per content entry below (presumably resolved by the Neural Coder engine -- verify).
+    - insert_below_model_definition_line  # receives the first snippet (ipex.optimize)
+    - insert_above_inference_line  # receives the second snippet (autocast context)
+    - indent_inference_line  # paired with the bare integer at the end of content
+  content:  # "[+]" marks a line to add; MODEL_NAME looks like a placeholder for the user's model variable -- TODO confirm.
+    - |-
+      [+] import torch
+      [+] import intel_extension_for_pytorch as ipex
+      [+] with torch.no_grad():
+      [+]     MODEL_NAME.eval()
+      [+]     MODEL_NAME = ipex.optimize(MODEL_NAME, dtype=torch.bfloat16)
+    - |-
+      [+] import torch
+      [+] with torch.cpu.amp.autocast(enabled=True, dtype=torch.bfloat16):
+    - 1  # presumably indent levels for the inference line: it ends up under the single "with" above -- TODO confirm
+  order:  # Presumably: a snippet goes below the backends under "below" and above those under "above" -- verify.
+    - below:
+        - pytorch_channels_last
+      above:
+        - pytorch_jit_script
+        - pytorch_jit_script_ofi
+        - pytorch_jit_trace
+        - pytorch_jit_trace_ofi
+    - below:
+      above:
+    - below:
+      above: