Summary: There is a tool called `2to3` whose `future` fixer you can target specifically to remove these redundant `from __future__` imports; the `caffe2` directory has the most of them:

```
2to3 -f future -w caffe2
```

Pull Request resolved: https://github.com/pytorch/pytorch/pull/45033
Reviewed By: seemethere
Differential Revision: D23808648
Pulled By: bugra
fbshipit-source-id: 38971900f0fe43ab44a9168e57f2307580d36a38
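For context, a minimal sketch of what that fixer does, driving the `lib2to3` API directly instead of the `2to3` CLI named above (lib2to3 ships with CPython up to 3.12, is deprecated, and was removed in 3.13). The example source string and the `"<example>"` label are illustrative, not part of this file:

```python
# Illustrative only: apply 2to3's `future` fixer to a code string.
from lib2to3 import refactor

src = (
    "from __future__ import absolute_import, division, print_function\n"
    "import numpy as np\n"
)

tool = refactor.RefactoringTool(["lib2to3.fixes.fix_future"])
# refactor_string returns the rewritten parse tree; str() gives back source.
print(str(tool.refactor_string(src, "<example>")))
# The __future__ import statement is stripped; `import numpy as np` is kept.
```

The command in the summary does the same rewrite in place across the whole `caffe2` tree (`-f future` selects the fixer, `-w` writes the changes back).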
191 lines
6.2 KiB
Python
import unittest

import hypothesis.strategies as st
from hypothesis import given
import numpy as np

from caffe2.proto import caffe2_pb2
from caffe2.python import core, workspace
import caffe2.python.hypothesis_test_util as hu
import caffe2.python.ideep_test_util as mu


@unittest.skipIf(not workspace.C.use_mkldnn, "No MKLDNN support.")
class ElementwiseSumTest(hu.HypothesisTestCase):
    @given(size=st.integers(7, 9),
           input_channels=st.integers(1, 3),
           batch_size=st.integers(1, 3),
           inputs=st.integers(2, 7),
           inplace=st.booleans(),
           **mu.gcs)
    def test_elementwise_sum(self,
                             size,
                             input_channels,
                             batch_size,
                             inputs,
                             inplace,
                             gc,
                             dc):
        # Run Sum on N random NCHW inputs and verify that output 0 matches
        # across all device options supplied by mu.gcs.
        op = core.CreateOperator(
            "Sum",
            ["X_{}".format(i) for i in range(inputs)],
            ["X_0" if inplace else "Y"],
        )
        Xs = [np.random.rand(batch_size, input_channels, size, size).astype(
            np.float32) for _ in range(inputs)]
        self.assertDeviceChecks(dc, op, Xs, [0])

    @given(size=st.integers(7, 9),
           input_channels=st.integers(1, 3),
           batch_size=st.integers(1, 3),
           inputs=st.integers(2, 7),
           inplace=st.booleans(),
           **mu.gcs_cpu_ideep)
    def test_elementwise_sum_fallback(self,
                                      size,
                                      input_channels,
                                      batch_size,
                                      inputs,
                                      inplace,
                                      gc,
                                      dc):
        op = core.CreateOperator(
            "Sum",
            ["X_{}".format(i) for i in range(inputs)],
            ["X_0" if inplace else "Y"],
            device_option=dc[1]
        )
        Xs = [np.random.rand(batch_size, input_channels, size, size).astype(
            np.float32) for _ in range(inputs)]

        # Accumulate a reference sum on the host while feeding the inputs;
        # X_0 is fed with dc[0] and the rest with dc[1] to exercise the
        # fallback path.
        sum_val = Xs[0]
        workspace.FeedBlob("X_0", Xs[0], dc[0])
        for i, x in enumerate(Xs):
            if i == 0:
                continue
            sum_val += x
            workspace.FeedBlob("X_{}".format(i), x, dc[1])

        workspace.RunOperatorOnce(op)
        Y = workspace.FetchBlob("X_0" if inplace else "Y")

        # Dump diagnostics before failing if the operator output diverges
        # from the reference sum.
        if not np.allclose(sum_val, Y, atol=0.01, rtol=0.01):
            print(Y.flatten())
            print(sum_val.flatten())
            print(np.max(np.abs(Y - sum_val)))
            self.assertTrue(False)

    @given(size=st.integers(7, 9),
           input_channels=st.integers(1, 3),
           batch_size=st.integers(1, 3),
           inputs=st.integers(2, 7),
           inplace=st.booleans(),
           **mu.gcs_cpu_ideep)
    def test_int8_elementwise_sum(self,
                                  size,
                                  input_channels,
                                  batch_size,
                                  inputs,
                                  inplace,
                                  gc,
                                  dc):
        # Reference: the fp32 Sum operator on the same inputs.
        sum_fp32 = core.CreateOperator(
            "Sum",
            ["X_{}".format(i) for i in range(inputs)],
            ["X_0" if inplace else "Y"],
        )
        Xs = [np.random.rand(batch_size, input_channels, size, size).astype(
            np.float32) for _ in range(inputs)]

        old_ws_name = workspace.CurrentWorkspace()
        workspace.SwitchWorkspace("_device_check_", True)

        # Per-input uint8 quantization parameters: full-range scale with zero
        # point 0 for non-negative tensors, otherwise zero point 128.
        Xi_scales = []
        Xi_zero_points = []
        for i, X in enumerate(Xs):
            workspace.FeedBlob("X_{}".format(i), X, dc[0])
            if X.min() >= 0:
                Xi_scales.append(np.absolute(X).max() / 0xFF)
                Xi_zero_points.append(0)
            else:
                Xi_scales.append(np.absolute(X).max() / 0x7F)
                Xi_zero_points.append(128)

        workspace.RunOperatorOnce(sum_fp32)
        Y = workspace.FetchBlob("X_0" if inplace else "Y")

        # Output quantization parameters, derived from the fp32 result.
        if Y.min() >= 0:
            Y_scale = np.absolute(Y).max() / 0xFF
            Y_zero_point = 0
        else:
            Y_scale = np.absolute(Y).max() / 0x7F
            Y_zero_point = 128

        workspace.ResetWorkspace()

        # Quantized pipeline: NCHW2NHWC -> Int8Quantize per input, then
        # Int8Sum, Int8Dequantize, and NHWC2NCHW for the output.
        net = caffe2_pb2.NetDef()
        for i, Xi in enumerate(Xs):
            workspace.FeedBlob("Xi_{}".format(i), Xi, dc[1])
            sw2nhwc = core.CreateOperator(
                "NCHW2NHWC",
                ["Xi_{}".format(i)],
                ["Xi_{}_nhwc".format(i)],
                device_option=dc[1]
            )
            quantize = core.CreateOperator(
                "Int8Quantize",
                ["Xi_{}_nhwc".format(i)],
                ["Xi_{}_quantized".format(i)],
                engine="DNNLOWP",
                device_option=dc[1],
                Y_zero_point=Xi_zero_points[i],
                Y_scale=Xi_scales[i],
            )
            net.op.extend([sw2nhwc, quantize])

        sum = core.CreateOperator(
            "Int8Sum",
            ["Xi_{}_quantized".format(i) for i in range(inputs)],
            ["Xi_0_quantized" if inplace else "Y_quantized"],
            engine="DNNLOWP",
            device_option=dc[1],
            Y_zero_point=Y_zero_point,
            Y_scale=Y_scale,
        )

        dequantize = core.CreateOperator(
            "Int8Dequantize",
            ["Xi_0_quantized" if inplace else "Y_quantized"],
            ["Y_nhwc"],
            engine="DNNLOWP",
            device_option=dc[1],
        )

        sw2nchw = core.CreateOperator(
            "NHWC2NCHW",
            ["Y_nhwc"],
            ["Y_out"],
            device_option=dc[1]
        )

        net.op.extend([sum, dequantize, sw2nchw])
        workspace.RunNetOnce(net)
        Y_out = workspace.FetchBlob("Y_out")

        # Compare the quantized result against the fp32 reference; dump
        # diagnostics before failing if the error is too large.
        MSE = np.square(np.subtract(Y, Y_out)).mean()
        if MSE > 0.005:
            print(Y.flatten())
            print(Y_out.flatten())
            print(np.max(np.abs(Y_out - Y)))
            print("MSE", MSE)
            self.assertTrue(False)

        workspace.SwitchWorkspace(old_ws_name)


if __name__ == "__main__":
    unittest.main()