[VTA] Hotfix for padded load test in Chisel VTA (#4264)

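* Update TensorUtil.scala: in the stride branch, shift dec.xstride by log2Ceil(elemBytes) instead of log2Ceil(strideFactor) when advancing caddr and baddr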

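* Update test_vta_insn.py: change the padded load test to n=3, m=5 with pad_before=[2, 1, 0, 0] and pad_after=[1, 2, 0, 0], and fill the input with random integers in [-10, 10) instead of all ones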
diff --git a/hardware/chisel/src/main/scala/core/TensorUtil.scala b/hardware/chisel/src/main/scala/core/TensorUtil.scala
index 1f00554..99e9012 100644
--- a/hardware/chisel/src/main/scala/core/TensorUtil.scala
+++ b/hardware/chisel/src/main/scala/core/TensorUtil.scala
@@ -319,8 +319,8 @@
     when(split) {
       caddr := caddr + xmax_bytes
     }.elsewhen(stride) {
-      caddr := baddr + (dec.xstride << log2Ceil(strideFactor))
-      baddr := baddr + (dec.xstride << log2Ceil(strideFactor))
+      caddr := baddr + (dec.xstride << log2Ceil(elemBytes))
+      baddr := baddr + (dec.xstride << log2Ceil(elemBytes))
     }
   }
 
diff --git a/tests/python/unittest/test_vta_insn.py b/tests/python/unittest/test_vta_insn.py
index 25d7d8c..574273f 100644
--- a/tests/python/unittest/test_vta_insn.py
+++ b/tests/python/unittest/test_vta_insn.py
@@ -89,10 +89,10 @@
     """Test padded load."""
     def _run(env, remote):
         # declare
-        n = 21
-        m = 20
-        pad_before = [0, 1, 0, 0]
-        pad_after = [1, 3, 0, 0]
+        n = 3
+        m = 5
+        pad_before = [2, 1, 0, 0]
+        pad_after = [1, 2, 0, 0]
         x = tvm.placeholder(
             (n, m, env.BATCH, env.BLOCK_OUT),
             name="x",
@@ -126,7 +126,7 @@
         f = remote.load_module("padded_load.o")
         # verify
         ctx = remote.ext_dev(0)
-        x_np = np.random.randint(1, 2, size=(
+        x_np = np.random.randint(-10, 10, size=(
             n, m, env.BATCH, env.BLOCK_OUT)).astype(x.dtype)
         y_np = np.zeros((n + pad_before[0] + pad_after[0],
                          m + pad_before[1] + pad_after[1],