thanks to vye16 ❤

fb5159d over 2 years ago

6.32 kB






	import unittest
	import hypothesis.strategies as st
	from hypothesis import given
	import numpy as np
	from caffe2.proto import caffe2_pb2
	from caffe2.python import core, workspace
	import caffe2.python.hypothesis_test_util as hu
	import caffe2.python.ideep_test_util as mu


	@unittest.skipIf(not workspace.C.use_mkldnn, "No MKLDNN support.")
	class ElementwiseSumTest(hu.HypothesisTestCase):
	@given(size=st.integers(7, 9),
	input_channels=st.integers(1, 3),
	batch_size=st.integers(1, 3),
	inputs=st.integers(2, 7),
	inplace=st.booleans(),
	**mu.gcs)
	def test_elementwise_sum(self,
	size,
	input_channels,
	batch_size,
	inputs,
	inplace,
	gc,
	dc):
	op = core.CreateOperator(
	"Sum",
	["X_{}".format(i) for i in range(inputs)],
	["X_0" if inplace else "Y"],
	)
	Xs = [np.random.rand(batch_size, input_channels, size, size).astype(
	np.float32) for _ in range(inputs)]
	self.assertDeviceChecks(dc, op, Xs, [0])


	@given(size=st.integers(7, 9),
	input_channels=st.integers(1, 3),
	batch_size=st.integers(1, 3),
	inputs=st.integers(2, 7),
	inplace=st.booleans(),
	**mu.gcs_cpu_ideep)
	def test_elementwise_sum_fallback(self,
	size,
	input_channels,
	batch_size,
	inputs,
	inplace,
	gc,
	dc):
	op = core.CreateOperator(
	"Sum",
	["X_{}".format(i) for i in range(inputs)],
	["X_0" if inplace else "Y"],
	device_option=dc[1]
	)
	Xs = [np.random.rand(batch_size, input_channels, size, size).astype(
	np.float32) for _ in range(inputs)]

	sum_val = Xs[0]
	workspace.FeedBlob("X_0", Xs[0], dc[0])
	for i, x in enumerate(Xs):
	if i == 0: continue
	sum_val += x
	workspace.FeedBlob("X_{}".format(i), x, dc[1])

	workspace.RunOperatorOnce(op)
	Y = workspace.FetchBlob("X_0" if inplace else "Y")

	if not np.allclose(sum_val, Y, atol=0.01, rtol=0.01):
	print(Y.flatten())
	print(sum_val.flatten())
	print(np.max(np.abs(Y - sum_val)))
	self.assertTrue(False)


	@given(size=st.integers(7, 9),
	input_channels=st.integers(1, 3),
	batch_size=st.integers(1, 3),
	inputs=st.integers(2, 7),
	inplace=st.booleans(),
	**mu.gcs_cpu_ideep)
	def test_int8_elementwise_sum(self,
	size,
	input_channels,
	batch_size,
	inputs,
	inplace,
	gc,
	dc):
	sum_fp32 = core.CreateOperator(
	"Sum",
	["X_{}".format(i) for i in range(inputs)],
	["X_0" if inplace else "Y"],
	)
	Xs = [np.random.rand(batch_size, input_channels, size, size).astype(
	np.float32) for _ in range(inputs)]

	old_ws_name = workspace.CurrentWorkspace()
	workspace.SwitchWorkspace("_device_check_", True)

	Xi_scales = []
	Xi_zero_points = []
	for i, X in enumerate(Xs):
	workspace.FeedBlob("X_{}".format(i), X, dc[0])
	if X.min() >= 0:
	Xi_scales.append(np.absolute(X).max() / 0xFF)
	Xi_zero_points.append(0)
	else:
	Xi_scales.append(np.absolute(X).max() / 0x7F)
	Xi_zero_points.append(128)

	workspace.RunOperatorOnce(sum_fp32)
	Y = workspace.FetchBlob("X_0" if inplace else "Y")

	if Y.min() >= 0:
	Y_scale = np.absolute(Y).max() / 0xFF
	Y_zero_point = 0
	else:
	Y_scale = np.absolute(Y).max() / 0x7F
	Y_zero_point = 128

	workspace.ResetWorkspace()

	net = caffe2_pb2.NetDef()
	for i, Xi in enumerate(Xs):
	workspace.FeedBlob("Xi_{}".format(i), Xi, dc[1])
	sw2nhwc = core.CreateOperator(
	"NCHW2NHWC",
	["Xi_{}".format(i)],
	["Xi_{}_nhwc".format(i)],
	device_option=dc[1]
	)
	quantize = core.CreateOperator(
	"Int8Quantize",
	["Xi_{}_nhwc".format(i)],
	["Xi_{}_quantized".format(i)],
	engine="DNNLOWP",
	device_option=dc[1],
	Y_zero_point=Xi_zero_points[i],
	Y_scale=Xi_scales[i],
	)
	net.op.extend([sw2nhwc, quantize])

	sum = core.CreateOperator(
	"Int8Sum",
	["Xi_{}_quantized".format(i) for i in range(inputs)],
	["Xi_0_quantized" if inplace else "Y_quantized"],
	engine="DNNLOWP",
	device_option=dc[1],
	Y_zero_point=Y_zero_point,
	Y_scale=Y_scale,
	)

	dequantize = core.CreateOperator(
	"Int8Dequantize",
	["Xi_0_quantized" if inplace else "Y_quantized"],
	["Y_nhwc"],
	engine="DNNLOWP",
	device_option=dc[1],
	)

	sw2nchw = core.CreateOperator(
	"NHWC2NCHW",
	["Y_nhwc"],
	["Y_out"],
	device_option=dc[1]
	)

	net.op.extend([sum, dequantize, sw2nchw])
	workspace.RunNetOnce(net)
	Y_out = workspace.FetchBlob("Y_out")

	MSE = np.square(np.subtract(Y, Y_out)).mean()
	if MSE > 0.005:
	print(Y.flatten())
	print(Y_out.flatten())
	print(np.max(np.abs(Y_out - Y)))
	print("MSE", MSE)
	self.assertTrue(False)

	workspace.SwitchWorkspace(old_ws_name)

	if __name__ == "__main__":
	unittest.main()