@@ -1190,7 +1190,7 @@ def test_np_linspace(config, dtype, endpoint, retstep):
     np_ret = onp.linspace(config, endpoint=endpoint, retstep=retstep, dtype=dtype)
     if retstep:
         assert_almost_equal(mx_ret[0].asnumpy(), np_ret[0], atol=1e-3, rtol=1e-5)
-        same(mx_ret[1], np_ret[1])
+        assert same(mx_ret[1], np_ret[1])
     else:
         assert_almost_equal(mx_ret.asnumpy(), np_ret, atol=1e-3, rtol=1e-5)
 
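A note on the pattern this hunk (and the ones below it) fixes: `same` from `mxnet.test_utils` returns a boolean rather than raising, so a bare `same(...)` call discards its result and the comparison never actually fails the test. A minimal sketch of the failure mode, assuming `same` is essentially an `array_equal` wrapper as in `mxnet.test_utils`:

```python
import numpy as onp

def same(a, b):
    # Stand-in for mxnet.test_utils.same, essentially an array_equal check.
    return onp.array_equal(a, b)

a, b = onp.array([1.0]), onp.array([2.0])
same(a, b)         # returns False, but the result is discarded: no failure
assert same(a, a)  # the asserted form actually gates the test on mismatch
```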
@@ -3735,13 +3735,13 @@ def forward(self, *arys):
         np_out = funcs["numpy"][n](*tensors_np)
         for i in range(len(tensors)):
             assert mx_out[i].shape == np_out[i].shape
-            same(mx_out[i].asnumpy(), np_out[i])
+            assert same(mx_out[i].asnumpy(), np_out[i])
 
         mx_out = funcs["mxnet"][n](*tensors)
         np_out = funcs["numpy"][n](*tensors_np)
         for i in range(len(tensors)):
             assert mx_out[i].shape == np_out[i].shape
-            same(mx_out[i].asnumpy(), np_out[i])
+            assert same(mx_out[i].asnumpy(), np_out[i])
 
 
 @use_np
@@ -5760,7 +5760,7 @@ def test_np_indices():
         for shape in shapes:
             np_out = onp.indices(dimensions=shape, dtype=dtype)
             mx_out = np.indices(dimensions=shape, dtype=dtype)
-            same(mx_out.asnumpy(), np_out)
+            assert same(mx_out.asnumpy(), np_out)
             assert mx_out.shape == np_out.shape
 
 @use_np
@@ -5782,7 +5782,7 @@ def forward(self, x):
         if hybridize:
             net.hybridize()
         mx_out = net(x)
-        same(mx_out.asnumpy(), np_out)
+        assert same(mx_out.asnumpy(), np_out)
         assert mx_out.shape == np_out.shape
 
 
@@ -8470,14 +8470,18 @@ def forward(self, a, indices):
             return np.take(a, indices, axis=self._axis, mode=self._mode)
 
     def grad_helper(grad_in, axis, idx, mode):
-        k = grad_in.shape[axis]
+        k = 1 if axis == None else grad_in.shape[axis]
         if mode == 'clip':
             idx = 0 if idx < 0 else idx
             idx = k - 1 if idx >= k else idx
         else:
             idx = idx % k
+
         if axis == None:
-            grad_in[idx] += 1.0
+            if grad_in.shape == ():
+                grad_in += 1.0
+            else:
+                grad_in[idx] += 1.0
         elif axis == 0:
             if axis == len(grad_in.shape) - 1:
                 grad_in[idx] += 1.0
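Context for the new `axis == None` branches: `np.take` with `axis=None` operates on the flattened input, and when the input is 0-d there is nothing to index, so the unit gradient must be accumulated into the scalar array itself. A plain-NumPy illustration of the edge case (not the test's own code):

```python
import numpy as onp

a = onp.array(3.0)                  # 0-d input
out = onp.take(a, 0, mode='clip')   # axis=None: indexes the flattened view
grad_in = onp.zeros(a.shape)        # shape == (), a 0-d gradient buffer

# grad_in[0] += 1.0 would raise IndexError ("too many indices") on a 0-d
# array, hence the grad_in.shape == () special case in grad_helper.
grad_in += 1.0
print(out, grad_in)                 # 3.0 1.0
```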
@@ -8506,7 +8510,8 @@ def grad_helper(grad_in, axis, idx, mode):
     def check_output_n_grad(data_shape, idx_shape, axis, mode):
         data_real = onp.random.normal(size=data_shape).astype('float32')
         idx_real = onp.random.randint(low=-100, high=100, size=idx_shape)
-        same(np.take(np.array(data_real), np.array(idx_real), axis=axis, mode=mode).asnumpy(),
+
+        assert same(np.take(np.array(data_real), np.array(idx_real), axis=axis, mode=mode).asnumpy(),
             onp.take(data_real, idx_real, axis=axis, mode=mode))
 
         grad_in = onp.zeros(data_shape, dtype='float32')
@@ -8518,15 +8523,15 @@ def check_output_n_grad(data_shape, idx_shape, axis, mode):
         x.attach_grad()
         with mx.autograd.record():
             mx_out = test_take(x, np.array(idx_real))
-        same(mx_out.asnumpy(), onp.take(data_real, idx_real, axis=axis, mode=mode))
+        assert same(mx_out.asnumpy(), onp.take(data_real, idx_real, axis=axis, mode=mode))
 
         if axis and axis < 0:
             axis += len(data_shape)
-        try:
+
+        if idx_real.size != 0:
             for i in onp.nditer(idx_real):
                 grad_helper(grad_in, axis, i, mode)
-        except:
-            pass
+
 
         mx_out.backward()
         same(x.grad.asnumpy(), grad_in)
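Replacing the bare `try/except: pass` with an explicit size check makes the intent visible: the only failure the old handler was masking is that `numpy.nditer` refuses zero-sized operands by default, so an empty index array silently skipped gradient accumulation via the exception path. A small sketch of that behavior:

```python
import numpy as onp

idx = onp.zeros((0,), dtype=onp.int64)   # empty index array

try:
    for i in onp.nditer(idx):
        pass
except ValueError as e:
    print(e)   # nditer disallows zero-sized operands by default

if idx.size != 0:        # the explicit guard used in the fixed test
    for i in onp.nditer(idx):
        pass
```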
@@ -10195,7 +10200,7 @@ def forward(self, cond, x, y):
     ]
     flags = [True, False]
     for ctype, dtype, shape_pair, hybridize in itertools.product(dtypes, dtypes, shape_configs, flags):
-        cond = np.random.uniform(low=0, high=100, size=shape_pair[0], dtype='float64').astype(ctype)
+        cond = np.round(np.random.uniform(low=0, high=2, size=shape_pair[0], dtype='float64')).astype(ctype)
         x = np.random.uniform(low=0, high=100, size=shape_pair[1], dtype='float64').astype(dtype)
         y = np.random.uniform(low=0, high=100, size=shape_pair[2], dtype='float64').astype(dtype)
         cond.attach_grad()
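Why the `cond` generator changes: a draw from `uniform(low=0, high=100)` is nonzero with probability one, so the old condition tensor made `where` always select `x` and left the `y` branch (and the zero side of the gradient) untested. Rounding a `uniform(0, 2)` draw produces a mix of zeros and nonzeros. A plain-NumPy sketch of the difference:

```python
import numpy as onp

rng = onp.random.default_rng(0)
old_cond = rng.uniform(0, 100, size=1000)            # almost surely all nonzero
new_cond = onp.round(rng.uniform(0, 2, size=1000))   # mix of 0s, 1s and 2s

print((old_cond == 0).any())   # False: the y branch is never exercised
print((new_cond == 0).any())   # True: both branches get exercised
```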
@@ -10206,37 +10211,50 @@ def forward(self, cond, x, y):
             test_mod.hybridize()
         with mx.autograd.record():
             ret = test_mod(cond, x, y)
-        same(ret.asnumpy(), onp.where(cond.asnumpy(), x.asnumpy(), y.asnumpy()))
+
+        assert same(ret.asnumpy(), onp.where(cond.asnumpy(), x.asnumpy(), y.asnumpy()))
         if dtype in [np.float16, np.float32, np.float64]:
             ret.backward()
-            same(cond.grad.asnumpy(), onp.zeros(shape_pair[0], dtype=ctype))
-            same(x.grad.asnumpy(), collapse_sum_like(onp.broadcast_to(cond.asnumpy(), ret.shape), shape_pair[1]))
+            assert same(cond.grad.asnumpy(), onp.zeros(shape_pair[0], dtype=ctype))
+
+            xgrad = x.grad.asnumpy()
+            npgrad = collapse_sum_like((onp.broadcast_to(cond.asnumpy(), ret.shape) != 0).astype(dtype), shape_pair[1])
+            npgrad = npgrad.astype(xgrad.dtype)
+            assert same(xgrad, npgrad)
 
         # check imperative again
         ret = np.where(cond, x, y)
-        same(ret.asnumpy(), onp.where(cond.asnumpy(), x.asnumpy(), y.asnumpy()))
+        assert same(ret.asnumpy(), onp.where(cond.asnumpy(), x.asnumpy(), y.asnumpy()))
 
         # check scalar case
         if dtype in [np.float16, np.float32, np.float64]:
             # lscalar
             with mx.autograd.record():
                 ret_lscalar = np.where(cond, 1, x)
-            same(ret.asnumpy(), onp.where(cond.asnumpy(), 1, x.asnumpy()))
+            assert same(ret_lscalar.asnumpy(), onp.where(cond.asnumpy(), 1, x.asnumpy()))
             ret_lscalar.backward()
-            same(x.grad.asnumpy(), 1 - collapse_sum_like(onp.broadcast_to(cond.asnumpy(), ret.shape), shape_pair[1]))
+
+            xgrad = x.grad.asnumpy()
+            npgrad = collapse_sum_like((onp.broadcast_to(cond.asnumpy(), ret_lscalar.shape) == 0).astype(dtype), shape_pair[1])
+            npgrad = npgrad.astype(xgrad.dtype)
+            assert same(xgrad, npgrad)
             # rscalar
             with mx.autograd.record():
                 ret_rscalar = np.where(cond, x, 1)
-            same(ret.asnumpy(), onp.where(cond.asnumpy(), x.asnumpy(), 1))
+            assert same(ret_rscalar.asnumpy(), onp.where(cond.asnumpy(), x.asnumpy(), 1))
             ret_rscalar.backward()
-            same(x.grad.asnumpy(), collapse_sum_like(onp.broadcast_to(cond.asnumpy(), ret.shape), shape_pair[1]))
+
+            xgrad = x.grad.asnumpy()
+            npgrad = collapse_sum_like((onp.broadcast_to(cond.asnumpy(), ret_rscalar.shape) != 0).astype(dtype), shape_pair[1])
+            npgrad = npgrad.astype(xgrad.dtype)
+            assert same(xgrad, npgrad)
 
     # check both scalar case
     x = onp.random.randint(0, 100)
    y = onp.random.randint(0, 100)
     mx_out = np.where(cond, x, y)
     np_out = onp.where(cond, x, y)
-    same(mx_out, np_out)
+    assert same(mx_out, np_out)
 
 
 @use_np
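The rewritten gradient checks encode the identity the old ones got wrong: for `ret = where(cond, x, y)`, the gradient with respect to `x` is the indicator `(cond != 0)` (or `(cond == 0)` when `x` sits in the else position, as in the lscalar case), summed over broadcast axes back down to `x`'s shape. The old expectation summed the raw `cond` values, which only coincides with the indicator when `cond` is 0/1-valued. A self-contained sketch, with a hypothetical stand-in for the test suite's `collapse_sum_like` helper:

```python
import numpy as onp

def collapse_sum_like(a, shape):
    # Hypothetical reimplementation of the test suite's helper: sum `a`
    # over the axes that broadcasting expanded, down to `shape`.
    a = a.sum(axis=tuple(range(a.ndim - len(shape))))
    axes = tuple(i for i, s in enumerate(shape) if s == 1 and a.shape[i] != 1)
    return a.sum(axis=axes, keepdims=True)

cond = onp.array([[0., 1.], [2., 0.]])
x = onp.ones((1, 2))                      # broadcasts against cond
# d(where(cond, x, y))/dx is 1 exactly where cond != 0:
expected = collapse_sum_like((cond != 0).astype(x.dtype), x.shape)
print(expected)                           # [[1. 1.]]
```

With the rounded `cond` from the earlier hunk no longer guaranteed to be 0/1-valued, the explicit `!= 0` indicator (plus the `astype` to match the dtype of MXNet's computed gradient) is what makes these assertions exact.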