# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

import mxnet as mx
import numpy as np
import unittest
import pytest
import ctypes
import copy

from mxnet.contrib import quantization
from mxnet.gluon import nn
from mxnet.test_utils import assert_almost_equal, assert_almost_equal_with_err
OP_NAME = 'op_name'
QUANTIZED_OP_NAME = 'quantized_op_name'
SG_PASS_NAME = 'MKLDNN'
QUANTIZE_SG_PASS_NAME = 'MKLDNN_QUANTIZE'

config = {
    'conv': {
        OP_NAME: 'sg_mkldnn_conv',
        QUANTIZED_OP_NAME: 'quantized_sg_mkldnn_conv'
    },
    'fc': {
        OP_NAME: 'sg_mkldnn_fully_connected',
        QUANTIZED_OP_NAME: 'quantized_sg_mkldnn_fully_connected'
    }
}

DATA_SHAPE = [(64, 4, 10, 10), (4, 3, 24, 24), (1, 16, 32, 32)]

# Helpers
class RELU6(nn.HybridBlock):
    """Relu6 used in MobileNetV2."""

    def __init__(self, **kwargs):
        super(RELU6, self).__init__(**kwargs)

    def hybrid_forward(self, F, x):
        return F.clip(x, 0, 6, name="relu6")

class TailNegBlock(nn.HybridBlock):
    """Tail block for negative-fusion tests: two Dense branches whose outputs
    are concatenated and passed through softmax."""

    def __init__(self, **kwargs):
        super(TailNegBlock, self).__init__(**kwargs)
        self.fc1 = nn.Dense(10, flatten=True)
        self.fc2 = nn.Dense(10, flatten=True)

    def hybrid_forward(self, F, x1, x2):
        out_fc1 = self.fc1(x1)
        out_fc2 = self.fc2(x2)
        out = F.concat(out_fc1, out_fc2)
        out = F.softmax(out)
        return out

class CustomNormalInit(mx.init.Initializer):
    """Initializes weights with random values sampled from a normal distribution
    with a custom mean and standard deviation of `sigma`.
    """
    def __init__(self, mean=0, sigma=0.01):
        super(CustomNormalInit, self).__init__(mean=mean, sigma=sigma)
        self.mean = mean
        self.sigma = sigma

    def _init_weight(self, _, arr):
        mx.random.normal(self.mean, self.sigma, arr.shape, dtype=arr.dtype, out=arr)

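# Usage sketch (hypothetical example, not part of the original tests): give
# weights a non-zero mean, e.g. to bias a layer's pre-activations positive:
#
#     net.initialize(CustomNormalInit(mean=0.5, sigma=0.2), force_reinit=True)
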
def check_qsym_calibrated(qsym, out_type, name='conv'):
    """Check that every quantized op in `qsym` carries calibration ranges and
    that the quantize nodes produce the requested output type."""
    quantized_op_name = 'quantized_' + name
    assert ''.join(qsym.attr_dict().keys()).find(quantized_op_name) != -1
    for k, v in qsym.attr_dict().items():
        if k.find('_quantize') != -1:
            assert v['out_type'] == out_type
        if k.find(quantized_op_name) != -1:
            # fully-connected nodes with float output carry no calibration ranges
            if quantized_op_name.startswith("quantized_sg_mkldnn_fully_connected") and 'enable_float_output' in v:
                continue
            assert 'min_calib_range' in v
            assert 'max_calib_range' in v

def check_qsym_scale_align(qsym):
    """Check that all quantized conv nodes share identical calibration ranges,
    i.e. that their scales were aligned."""
    assert ''.join(qsym.attr_dict().keys()).find('quantized_sg_mkldnn_conv') != -1
    init = False
    for k, v in qsym.attr_dict().items():
        if k.find('quantized_sg_mkldnn_conv') != -1:
            assert 'min_calib_range' in v
            assert 'max_calib_range' in v
            if not init:
                min_calib_range = v['min_calib_range']
                max_calib_range = v['max_calib_range']
                init = True
            else:
                assert min_calib_range == v['min_calib_range']
                assert max_calib_range == v['max_calib_range']

def check_quantize(net_original, data_shape, out_type, name='conv',
                   check_calibration=True, check_scale_align=False):
    """Quantize `net_original` with naive calibration and compare its outputs
    against the fp32 reference within a tolerance derived from the output range."""
    quantize_granularity_list = ['tensor-wise']
    if name == 'fc':
        quantize_granularity_list += ['channel-wise']

    if name in config:
        name = config[name][OP_NAME]

    net_original.initialize(init=mx.init.Normal(0.5), force_reinit=True)
    # uint8 cannot represent negative inputs, so restrict the data range accordingly
    min_value = -1 if out_type != 'uint8' else 0
    data = mx.random.uniform(min_value, 1.0, shape=data_shape, dtype='float32', ctx=mx.current_context())

    outputs = net_original(data)
    for output in outputs:
        output.wait_to_read()
    ref_out = outputs

    calib_data = mx.gluon.data.DataLoader(data, batch_size=1)
    for quantize_granularity in quantize_granularity_list:
        qnet = quantization.quantize_net(net_original,
                                         ctx=mx.current_context(),
                                         exclude_layers=None,
                                         exclude_operators=None,
                                         quantized_dtype=out_type,
                                         calib_mode='naive',
                                         calib_data=calib_data,
                                         num_calib_batches=1,
                                         quantize_mode='full',
                                         quantize_granularity=quantize_granularity)
        qsym, _ = qnet.export(None)
        if check_calibration:
            check_qsym_calibrated(qsym, out_type, name=name)
        if check_scale_align:
            check_qsym_scale_align(qsym)

        quantized_out = qnet(data)
        for i in range(len(ref_out)):
            min_range = mx.nd.min(ref_out[i]).asscalar()
            max_range = mx.nd.max(ref_out[i]).asscalar()
            atol = 0.1 * max(abs(min_range), abs(max_range))
            # compare output-by-output; both sides must be indexed consistently
            assert_almost_equal_with_err(quantized_out[i].asnumpy(), ref_out[i].asnumpy(),
                                         rtol=0.1, atol=atol, etol=0.2)

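# Usage sketch (hypothetical example, not part of the original test suite):
# quantize a small conv+relu block to int8 and check it against fp32.
#
#     net = nn.HybridSequential()
#     net.add(nn.Conv2D(channels=16, kernel_size=(3, 3)))
#     net.add(nn.Activation('relu'))
#     check_quantize(net, (4, 3, 24, 24), 'int8', name='conv')
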
def check_fusion(net_original, data_shape, attrs_dict, check_fp32_fusion=True, check_quantization=True,
                 out_types=['uint8', 'int8', 'auto'], dedup_subgraph=True):
    """Run the MKLDNN subgraph pass on `net_original`, verify that the expected
    fused ops (and their attributes) appear, check that fused and unfused outputs
    match, and optionally check quantization for each requested output type."""
    net_original.initialize()
    net_original.hybridize(static_alloc=False, static_shape=False)
    data = mx.random.uniform(shape=data_shape, dtype='float32', ctx=mx.current_context())
    net_original(data)
    net_fusion = copy.copy(net_original)
    sym, params = net_original.export(None)

    if check_fp32_fusion:
        data_min = -1.0
        data_max = 1.0
        if ''.join(sym.get_internals().list_outputs()).find('sqrt') != -1:
            # sqrt is only defined for non-negative inputs, so keep data >= 0
            # and skip the quantization check for such graphs
            check_quantization = False
            data_min = 0

        sym_sg = sym.optimize_for(SG_PASS_NAME, dedup_subgraph=dedup_subgraph, skip_infer=True)
        for name, attrs in attrs_dict.items():
            if name in config:
                op_name = config[name][OP_NAME]
            else:
                op_name = name
            assert ''.join(sym_sg.get_internals().list_outputs()).find(op_name) != -1
            if len(attrs):
                found = False
                for k, v in sym_sg.attr_dict().items():
                    if k.find(op_name) != -1:
                        found = True
                        for attr_name, attr_value in attrs.items():
                            assert v[attr_name].lower() == attr_value.lower()
                assert found

        data = mx.nd.random.uniform(shape=data_shape, low=data_min, high=data_max)
        out_unfused = net_original(data)

        net_fusion.optimize_for(data, backend=SG_PASS_NAME)
        out_fused = net_fusion(data)

        assert_almost_equal(out_unfused.asnumpy(), out_fused.asnumpy(), rtol=1e-3, atol=1e-1)

    if check_quantization:
        # fp32 to int8
        for out_type in out_types:
            check_quantize(net_original, data_shape, out_type, name=name)

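# Usage sketch (hypothetical example): expect a Conv2D followed by ReLU to be
# fused into a single sg_mkldnn_conv node with activation fusion enabled.
# The attribute name 'with_act' is an assumption; adjust it to whatever
# attribute the backend actually emits on the fused node.
#
#     net = nn.HybridSequential()
#     net.add(nn.Conv2D(channels=16, kernel_size=(3, 3)))
#     net.add(nn.Activation('relu'))
#     check_fusion(net, (4, 3, 24, 24), {'conv': {'with_act': 'true'}})
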
def check_neg_fusion(net_original, attrs_name=None, excluded_attrs=None,
                     data_shapes=(4, 4, 10, 10), name='conv'):
    """Verify that full fusion did NOT happen: the fused op must carry every
    attribute in `attrs_name` and none of the attributes in `excluded_attrs`."""
    # guard the None defaults so iterating below cannot raise TypeError
    attrs_name = attrs_name or []
    excluded_attrs = excluded_attrs or []
    op_name = config[name][OP_NAME]

    data_nd = mx.nd.random.uniform(shape=data_shapes)
    net_original.initialize()
    net_original.hybridize()
    net_original(data_nd)

    sym, _ = net_original.export(None)
    sym_sg = sym.optimize_for(SG_PASS_NAME, dedup_subgraph=True, skip_infer=True)

    attrs_dict = sym_sg.attr_dict()
    for k, v in attrs_dict.items():
        if k.find(op_name) != -1:
            for attr in attrs_name:
                assert v[attr] == 'true'
            for exc_attr in excluded_attrs:
                assert exc_attr not in v.keys()
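
# Usage sketch (hypothetical example): a pattern the backend should only
# partially fuse. The block and the attribute names 'with_bn' / 'with_sum'
# are assumptions for illustration, not values taken from this file.
#
#     net = some_partially_fusable_block()   # hypothetical block under test
#     check_neg_fusion(net, attrs_name=['with_bn'],
#                      excluded_attrs=['with_sum'],
#                      data_shapes=(4, 4, 10, 10), name='conv')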