Commit 31fb14e4 by Tianqi Chen Committed by GitHub

[TOPI] Formalize the tag system (#473)

parent 0a6c36ce
......@@ -8,8 +8,8 @@
namespace topi {
constexpr auto kElementWise = "ewise";
constexpr auto kBroadcast = "bcast";
constexpr auto kElementWise = "elemwise";
constexpr auto kBroadcast = "broadcast";
constexpr auto kMatMult = "matmult";
constexpr auto kConv2dNCHW = "conv2d_nchw";
constexpr auto kConv2dHWCN = "conv2d_hwcn";
......
......@@ -11,6 +11,7 @@ from __future__ import absolute_import as _abs
from .math import *
from .reduction import *
from .transform import *
from .broadcast import *
from . import nn
from . import cuda
......
......@@ -2,6 +2,7 @@
"""Broadcast operators"""
from __future__ import absolute_import as _abs
import tvm
from . import tag
from .util import get_const_tuple, equal_const_int
def _get_bcast_info(original_shape, target_shape):
......@@ -113,7 +114,7 @@ def broadcast_to(data, shape):
return ret
@tvm.tag_scope(tag="broadcast_binary_op")
@tvm.tag_scope(tag=tag.BROADCAST)
def broadcast_binary_op(lhs, rhs, func, name="bop"):
"""Binary operands that will automatically broadcast the inputs
......
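A minimal sketch (editor's addition, not part of this commit) of how tvm.tag_scope attaches the tag to the ops created inside it, so that schedules can later dispatch on op.tag. add_bias is a hypothetical helper and the shapes are purely illustrative.

import tvm
from topi import tag

@tvm.tag_scope(tag=tag.BROADCAST)
def add_bias(data, bias):
    # Hypothetical broadcast op: add a per-channel bias to an NCHW tensor.
    return tvm.compute(data.shape,
                       lambda n, c, h, w: data[n, c, h, w] + bias[c],
                       name="add_bias")

A = tvm.placeholder((1, 64, 32, 32), name="A")
B = tvm.placeholder((64,), name="B")
C = add_bias(A, B)
assert C.op.tag == tag.BROADCAST  # schedules key off this tag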
......@@ -8,6 +8,5 @@ from .depthwise_conv2d import schedule_depthwise_conv2d_nchw, schedule_depthwise
from .depthwise_conv2d import schedule_depthwise_conv2d_backward_input_nhwc
from .depthwise_conv2d import schedule_depthwise_conv2d_backward_weight_nhwc
from .reduction import schedule_reduce
from .broadcast import schedule_broadcast
from .softmax import schedule_softmax
from .elemwise import schedule_elemwise
from .injective import schedule_injective, schedule_elemwise, schedule_broadcast
# pylint: disable=invalid-name,unused-variable
"""Schedule for broadcast operators"""
from __future__ import absolute_import as _abs
import tvm
from .elemwise import _schedule_elemwise
def schedule_broadcast(outs):
"""Schedule for broadcasting ops (broadcast_to + broadcast binary) + element-wise ops.
Parameters
----------
outs: Array of Tensor
The computation graph description of broadcast_to in the format
of an array of tensors.
Returns
-------
sch: Schedule
The computation schedule for the op.
"""
outs = [outs] if isinstance(outs, tvm.tensor.Tensor) else outs
sch = tvm.create_schedule([x.op for x in outs])
def traverse(operator):
if operator.tag == 'ewise' or operator.tag == 'scale_shift':
if operator not in sch.outputs:
sch[operator].compute_inline()
for tensor in operator.input_tensors:
if tensor.op.input_tensors:
traverse(tensor.op)
elif operator.tag == 'broadcast_to' or operator.tag == 'broadcast_binary_op':
_schedule_elemwise(operator, sch)
else:
raise RuntimeError("Unsupported operator: %s" % operator.tag)
traverse(outs[0].op)
return sch
# pylint: disable=invalid-name, too-many-locals, too-many-statements
"""Schedule for conv2d_hwcn with auto fusion"""
import tvm
from .. import tag
def schedule_conv2d_hwcn(outs):
"""Schedule for conv2d_hwcn and any element-wise operations.
......@@ -101,7 +101,7 @@ def schedule_conv2d_hwcn(outs):
def traverse(operator):
"""Traverse operators from computation graph"""
if operator.tag == 'ewise' or operator.tag == 'scale_shift':
if tag.is_broadcast(operator.tag):
if operator not in sch.outputs:
sch[operator].compute_inline()
for tensor in operator.input_tensors:
......
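A short editor's sketch of why the traverse above now accepts elementwise producers: relu is tagged tag.ELEMWISE in this commit, and tag.is_broadcast() treats elemwise tags as broadcast-compatible, so such stages are inlined into the convolution schedule instead of being scheduled separately.

import tvm
import topi
from topi import tag

A = tvm.placeholder((1, 64, 56, 56), name="A")
R = topi.nn.relu(A)                 # tagged tag.ELEMWISE in this commit
assert tag.is_broadcast(R.op.tag)   # accepted by traverse(), hence inlined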
......@@ -2,6 +2,7 @@
"""Schedule for conv2d_nchw with auto fusion"""
import tvm
from .. import util
from .. import tag
def conv2d_224_3_64(s, temp_S, Filter_S, Out, Out_L):
"""Schedule conv2d for specific feature_in_out_filter pattern"""
......@@ -389,7 +390,7 @@ def schedule_conv2d_small_batch(outs):
def traverse(OP):
"""Traverse operators from computation graph"""
# inline all one-to-one-mapping operators except the last stage (output)
if 'ewise' in OP.tag or 'bcast' in OP.tag:
if tag.is_broadcast(OP.tag):
if OP not in s.outputs:
s[OP].compute_inline()
for tensor in OP.input_tensors:
......
......@@ -2,6 +2,7 @@
"""Schedule for depthwise_conv2d with auto fusion"""
import tvm
from ..util import get_const_tuple
from .. import tag
def schedule_depthwise_conv2d_nchw(outs):
"""Schedule for depthwise_conv2d nchw forward.
......@@ -100,7 +101,7 @@ def schedule_depthwise_conv2d_nchw(outs):
def traverse(OP):
# inline all one-to-one-mapping operators except the last stage (output)
if 'ewise' in OP.tag or 'bcast' in OP.tag:
if tag.is_broadcast(OP.tag):
if OP not in s.outputs:
s[OP].compute_inline()
for tensor in OP.input_tensors:
......@@ -171,7 +172,7 @@ def schedule_depthwise_conv2d_nhwc(outs):
def traverse(OP):
# inline all one-to-one-mapping operators except the last stage (output)
if 'ewise' in OP.tag or 'bcast' in OP.tag:
if tag.is_broadcast(OP.tag):
if OP not in s.outputs:
s[OP].compute_inline()
for tensor in OP.input_tensors:
......
# pylint: disable=invalid-name, unused-variable, trailing-whitespace, no-member
"""Schedule for element wise operator"""
# pylint: disable=invalid-name, unused-variable,
"""Schedule for composition of injective operator"""
import tvm
def _schedule_elemwise(op, sch):
def _schedule_injective(op, sch):
x = op.output(0)
fused = sch[x].fuse(*sch[x].op.axis)
num_thread = 512
......@@ -13,8 +12,8 @@ def _schedule_elemwise(op, sch):
return sch
def schedule_elemwise(outs):
"""Schedule for element wise op.
def schedule_injective(outs):
"""Schedule for injective op.
Parameters
----------
......@@ -31,4 +30,7 @@ def schedule_elemwise(outs):
s = tvm.create_schedule([x.op for x in outs])
tvm.schedule.AutoInlineInjective(s)
return _schedule_elemwise(outs[0].op, s)
return _schedule_injective(outs[0].op, s)
schedule_elemwise = schedule_injective
schedule_broadcast = schedule_injective
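The hunk above elides the middle of _schedule_injective; the following editor's sketch shows the typical GPU pattern (fuse all output axes, split by the thread count, bind to block/thread indices). The exact factors and names in the real file may differ.

import tvm

def _schedule_injective_sketch(op, sch):
    x = op.output(0)
    fused = sch[x].fuse(*sch[x].op.axis)     # collapse all output axes
    num_thread = 512
    bx, tx = sch[x].split(fused, factor=num_thread)
    sch[x].bind(bx, tvm.thread_axis("blockIdx.x"))
    sch[x].bind(tx, tvm.thread_axis("threadIdx.x"))
    return sch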
......@@ -2,7 +2,7 @@
"""Schedule for reduce operators"""
from __future__ import absolute_import as _abs
import tvm
from .. import tag
def _schedule_reduce(op, sch):
data_in = op.input_tensors[0]
......@@ -42,7 +42,7 @@ def _schedule_reduce(op, sch):
def schedule_reduce(outs):
"""Schedule for reduce ops + ewise + scale_shift ops.
"""Schedule for inject->reduce->bcast ops.
Parameters
----------
......@@ -58,7 +58,7 @@ def schedule_reduce(outs):
outs = [outs] if isinstance(outs, tvm.tensor.Tensor) else outs
sch = tvm.create_schedule([x.op for x in outs])
def traverse(operator):
if operator.tag == 'ewise' or operator.tag == 'scale_shift':
if tag.is_injective(operator.tag):
if operator not in sch.outputs:
sch[operator].compute_inline()
for tensor in operator.input_tensors:
......
"""Elementwise operators"""
from __future__ import absolute_import as _abs
import tvm
from . import tag
@tvm.tag_scope(tag='ewise')
@tvm.tag_scope(tag=tag.ELEMWISE)
def identity(x):
"""Take identity of input x.
......@@ -20,9 +21,9 @@ def identity(x):
return tvm.compute(x.shape, lambda *i: x(*i))
@tvm.tag_scope(tag='ewise')
@tvm.tag_scope(tag=tag.ELEMWISE)
def negative(x):
"""Take negative of input x.
"""Take negation of input x.
Parameters
----------
......@@ -38,7 +39,7 @@ def negative(x):
return tvm.compute(x.shape, lambda *i: -x(*i))
@tvm.tag_scope(tag="ewise")
@tvm.tag_scope(tag=tag.ELEMWISE)
def exp(x):
"""Take exponential of input x.
......@@ -55,7 +56,7 @@ def exp(x):
return tvm.compute(x.shape, lambda *i: tvm.exp(x(*i)))
@tvm.tag_scope(tag="ewise")
@tvm.tag_scope(tag=tag.ELEMWISE)
def tanh(x):
"""Take hyperbolic tanh of input x.
......@@ -72,7 +73,7 @@ def tanh(x):
return tvm.compute(x.shape, lambda *i: tvm.tanh(x(*i)))
@tvm.tag_scope(tag="ewise")
@tvm.tag_scope(tag=tag.ELEMWISE)
def log(x):
"""Take logarithm of input x.
......@@ -89,7 +90,7 @@ def log(x):
return tvm.compute(x.shape, lambda *i: tvm.log(x(*i)))
@tvm.tag_scope(tag="ewise")
@tvm.tag_scope(tag=tag.ELEMWISE)
def sqrt(x):
"""Take square root of input x.
......@@ -106,7 +107,7 @@ def sqrt(x):
return tvm.compute(x.shape, lambda *i: tvm.sqrt(x(*i)))
@tvm.tag_scope(tag="ewise")
@tvm.tag_scope(tag=tag.ELEMWISE)
def sigmoid(x):
"""Take sigmoid tanh of input x.
......
"""TVM operator batch normalization compute."""
from __future__ import absolute_import
import tvm
from .. import tag
@tvm.tag_scope(tag='batch_norm')
def batch_norm(data, gamma, beta, moving_mean, moving_var, eps, fix_gamma):
"""Batch normalization operator in NCHW layout.
@tvm.tag_scope(tag=tag.BROADCAST)
def batch_norm_inference(data, gamma, beta, moving_mean, moving_var, eps, fix_gamma):
"""Batch normalization inference operator in NCHW layout.
Parameters
----------
......
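The body of batch_norm_inference is elided above. As an editor's sketch only (not the exact implementation in this commit), an NCHW inference-mode batch norm under tag.BROADCAST can look like the following, where fix_gamma replaces gamma with 1.

import tvm
from topi import tag

@tvm.tag_scope(tag=tag.BROADCAST)
def batch_norm_inference_sketch(data, gamma, beta, moving_mean, moving_var,
                                eps, fix_gamma):
    def _compute(b, c, h, w):
        # Normalize with the running statistics, then scale and shift.
        scale = 1.0 if fix_gamma else gamma[c]
        return ((data[b, c, h, w] - moving_mean[c]) /
                tvm.sqrt(moving_var[c] + eps) * scale + beta[c])
    return tvm.compute(data.shape, _compute, name="BatchNormInference")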
......@@ -93,6 +93,7 @@ def _get_workload(data, kernel, stride, padding):
HSTR, WSTR = stride, stride
return Workload(IH, IW, CI, CO, KH, KW, HPAD, WPAD, HSTR, WSTR)
def _get_schedule(wkl, target=None):
""" Get the platform specific schedule. """
if target is None:
......
......@@ -3,9 +3,9 @@
from __future__ import absolute_import as _abs
import tvm
from .. import util
from .. import tag
@tvm.tag_scope(tag="dilation")
@tvm.tag_scope(tag=tag.INJECTIVE)
def dilate(data, strides, name="DilatedInput"):
"""Dilate data with zeros.
......
"""Elementwise operators"""
from __future__ import absolute_import as _abs
import tvm
from .. import tag
@tvm.tag_scope(tag="ewise")
@tvm.tag_scope(tag=tag.ELEMWISE)
def relu(x):
"""Take relu of input x.
......
"""TVM operator flatten compute."""
from __future__ import absolute_import
import tvm
from .. import tag
@tvm.tag_scope(tag='flatten')
@tvm.tag_scope(tag=tag.INJECTIVE)
def flatten(data):
"""Flattens the input array into a 2-D array by collapsing the higher dimensions.
......
......@@ -2,8 +2,9 @@
"""Operators of one-to-one-mapping on the first input"""
from __future__ import absolute_import as _abs
import tvm
from .. import tag
@tvm.tag_scope(tag="bcast_scale_shift_nchw")
@tvm.tag_scope(tag=tag.BROADCAST)
def scale_shift_nchw(Input, Scale, Shift):
"""Batch normalization operator in inference.
......@@ -25,7 +26,8 @@ def scale_shift_nchw(Input, Scale, Shift):
"""
return tvm.compute(Input.shape, lambda b, c, i, j: Input[b, c, i, j] * Scale[c] + Shift[c], name='ScaleShift')
@tvm.tag_scope(tag="bcast_scale_shift_nhwc")
@tvm.tag_scope(tag=tag.BROADCAST)
def scale_shift_nhwc(Input, Scale, Shift):
"""Batch normalization operator in inference.
......
......@@ -2,8 +2,9 @@
from __future__ import absolute_import as _abs
import tvm
from ..util import equal_const_int
from .. import tag
@tvm.tag_scope(tag="pad")
@tvm.tag_scope(tag=tag.INJECTIVE+",pad")
def pad(data, pad_before, pad_after=None, pad_value=0.0, name="PadInput"):
"""Dilate Input with zeros.
......
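An editor's usage sketch of the composed tag introduced here (assuming pad is exposed as topi.nn.pad): the generic category comes first, so the prefix checks in tag.py still match, while the ",pad" suffix remains available for specialized schedules.

import tvm
import topi
from topi import tag

A = tvm.placeholder((1, 3, 32, 32), name="A")
P = topi.nn.pad(A, pad_before=[0, 0, 1, 1], pad_after=[0, 0, 1, 1])
assert P.op.tag == tag.INJECTIVE + ",pad"
assert tag.is_injective(P.op.tag)       # matches on the generic prefix
assert not tag.is_broadcast(P.op.tag)   # pad is injective, not broadcast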
......@@ -3,6 +3,7 @@
from __future__ import absolute_import as _abs
import tvm
from .. import target as _target
from .. import tag
from ..nn.convolution import SpatialPack, Im2ColPack
from ..nn.convolution import _CONV_DECLARATION, _CONV_SCHEDULE
from ..nn.convolution import _WORKLOADS, _SCH_TO_DECL_FUNC
......@@ -270,7 +271,7 @@ def schedule_convolution(outs):
def traverse(op):
"""Traverse operators from computation graph"""
# inline all one-to-one-mapping operators except the last stage (output)
if 'ewise' in op.tag or 'bcast' in op.tag:
if tag.is_broadcast(op.tag):
if op not in s.outputs:
s[op].compute_inline()
for tensor in op.input_tensors:
......
......@@ -2,7 +2,7 @@
"""Reduce operators"""
from __future__ import absolute_import as _abs
import tvm
from . import tag
def _get_real_axis(ndim, axis):
if axis is None:
......@@ -37,7 +37,7 @@ def get_reduce_out_shape(src_shape, axis=None, keepdims=False):
return dst_shape
@tvm.tag_scope(tag="comm_reduce")
@tvm.tag_scope(tag=tag.COMM_REDUCE)
def comm_reduce(data, axis=None, keepdims=False, func=tvm.sum):
"""Reducing the data
......
"""Namespace of all tag system in tvm
Each operator can be tagged with a tag that indicates its type.
Generic categories
- tag.ELEMWISE="elemwise":
Elementwise operator, for example :code:`out[i, j] = input[i, j]`
- tag.BROADCAST="broadcast":
Broadcasting operator that can always map output axes to the input axes in order,
for example :code:`out[i, ax1, j, ax2] = input[i, j]`.
Note that the axes need to stay in order, so transpose is not a broadcast operator.
If an input of a broadcast operator has the same shape as the output,
the relation to that input is guaranteed to be elementwise.
- tag.INJECTIVE="injective":
Injective operator that can always injectively map each output axis to a single input axis.
All injective operators can still be safely fused into reductions, just like elementwise operators.
- tag.COMM_REDUCE="comm_reduce":
Commutative reduction operator
- If an op does not belong to these generic categories, it should have a special tag.
Note
----
When we add a new topi operator, the op needs to be tagged as generically as possible.
We can also compose tags like "injective,pad" to carry both generic and specific information.
When we use composed tags, we must always put the generic tag first.
"""
ELEMWISE = "elemwise"
BROADCAST = "broadcast"
INJECTIVE = "injective"
COMM_REDUCE = "comm_reduce"
def is_broadcast(tag):
"""Check if a tag is bcast
Parameters
----------
tag : str
The input tag
Returns
-------
ret : bool
Whether a tag is broadcast
"""
if tag in (ELEMWISE, BROADCAST):
return True
return tag.startswith(ELEMWISE) or tag.startswith(BROADCAST)
def is_injective(tag):
"""Check if a tag is injective
Parameters
----------
tag : str
The input tag
Returns
-------
ret : bool
Whether a tag is injective
"""
if tag in (ELEMWISE, BROADCAST, INJECTIVE):
return True
return (tag.startswith(ELEMWISE) or
tag.startswith(BROADCAST) or
tag.startswith(INJECTIVE))
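An editor's summary of how the two predicates above behave on the generic tags and on a composed tag (the values follow directly from the code in this file):

from topi import tag

assert tag.is_broadcast(tag.ELEMWISE)        # elemwise is a special case of broadcast
assert tag.is_broadcast(tag.BROADCAST)
assert not tag.is_broadcast(tag.INJECTIVE)   # e.g. transpose reorders axes
assert tag.is_injective(tag.BROADCAST)       # every broadcast op is injective
assert tag.is_injective("injective,pad")     # composed tag, generic part first
assert not tag.is_injective(tag.COMM_REDUCE) # reductions are scheduled separately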
"""Injective transformation operators"""
from __future__ import absolute_import as _abs
import tvm
from . import tag
@tvm.tag_scope(tag=tag.BROADCAST)
def expand_dims(a, axis, num_newaxis=1):
"""Expand the shape of an array.
Parameters
----------
a : tvm.Tensor
The tensor to be expanded.
axis : int
The axis at which the new axes are inserted; a negative value counts from the end.
num_newaxis: int, optional
Number of new axes to be inserted at the given axis.
Returns
-------
ret : tvm.Tensor
"""
axis = len(a.shape) + axis + 1 if axis < 0 else axis
new_shape = a.shape[:axis] + ([1] * num_newaxis) + a.shape[axis:]
def _compute(*indices):
idx = indices[:axis] + indices[axis + num_newaxis:]
return a(*idx)
return tvm.compute(new_shape, _compute)
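An editor's usage sketch; the output shapes follow directly from the new_shape construction above, including the negative-axis normalization.

import tvm
import topi

A = tvm.placeholder((3, 10), name="A")
B = topi.expand_dims(A, axis=2, num_newaxis=2)   # shape (3, 10, 1, 1)
C = topi.expand_dims(A, axis=-1)                 # shape (3, 10, 1)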
......@@ -16,7 +16,6 @@ def verify_convolution(batch, in_size, in_channel, num_filter, kernel, stride, p
B = topi.nn.convolution(A, W, stride, padding)
s = topi.rasp.schedule_convolution([B])
a_shape = get_const_tuple(A.shape)
w_shape = get_const_tuple(W.shape)
dtype = A.dtype
......
"""Test code for broadcasting operators."""
import numpy as np
import tvm
import topi
def verify_expand_dims(in_shape, out_shape, axis, num_newaxis):
A = tvm.placeholder(shape=in_shape, name="A")
B = topi.expand_dims(A, axis, num_newaxis)
s = topi.cuda.schedule_broadcast(B)
def check_device(device):
if not tvm.module.enabled(device):
print("Skip because %s is not enabled" % device)
return
ctx = tvm.gpu(0) if device == "cuda" else tvm.cl(0)
foo = tvm.build(s, [A, B], device, name="expand_dims")
data_npy = np.random.uniform(size=in_shape).astype(A.dtype)
out_npy = data_npy.reshape(out_shape)
data_nd = tvm.nd.array(data_npy, ctx)
out_nd = tvm.nd.array(np.empty(out_shape).astype(B.dtype), ctx)
foo(data_nd, out_nd)
np.testing.assert_allclose(out_nd.asnumpy(), out_npy)
check_device("opencl")
check_device("cuda")
check_device("metal")
def test_expand_dims():
verify_expand_dims((3, 10), (3, 10, 1, 1), 2, 2)
if __name__ == "__main__":
test_expand_dims()