[TOPI] Fix mali conv2d performance regression (#3131)

* [TOPI] fix mali conv
* fix typo
* address comments

[TOPI] Fix mali conv2d performance regression (#3131)
* [TOPI] fix mali conv
* fix typo
* address comments
88daa2bc · Lianmin Zheng · Yizhi Liu · 48c92376 · 88daa2bc · 88daa2bc
Commit 88daa2bc, authored May 05, 2019 by Lianmin Zheng; committed by Yizhi Liu May 05, 2019
Hide whitespace changes
Inline Side-by-side

Showing with 6 additions and 4 deletions

python/tvm/autotvm/tophub.py
+1 -1

topi/python/topi/mali/conv2d.py
+5 -3

No files found.
--- a/python/tvm/autotvm/tophub.py
+++ b/python/tvm/autotvm/tophub.py
@@ -42,7 +42,7 @@ PACKAGE_VERSION = {
    'cuda':    "v0.04",
    'rocm':    "v0.02",
    'opencl':  "v0.02",
-    'mali':    "v0.04",
+    'mali':    "v0.05",
    'vta':     "v0.04",
 }

--- a/topi/python/topi/mali/conv2d.py
+++ b/topi/python/topi/mali/conv2d.py
@@ -352,9 +352,11 @@ def _decl_winograd(cfg, data, kernel, strides, padding, dilation, layout, out_dt
    # unpack output
    output = tvm.compute((N, CO, H, W), lambda n, co, h, w:
                         Y[co][n * nH * nW + (h//m) * nW + w//m][h % m][w % m]
-                         # thw following term is used to make the padding effective,
+                         # The following hack term is used to make the padding in batch gemm ("M")
-                         # otherwise the padding will be eliminated by bound inference
+                         # effective, otherwise the padding will be eliminated by bound inference.
-                         + tvm.const(0, out_dtype) * M[alpha-1][alpha-1][CO-1][P_round-1],
+                         # Use `tvm.expr.Mul` instead of `*` to avoid issues in const folding.
+                         + tvm.expr.Mul(tvm.const(0, out_dtype),
+                                        M[alpha-1][alpha-1][CO-1][P_round-1]),
                         name='output', tag='winograd_conv2d_output')
    # we have to manually assign effective GFLOP for winograd