Commit c6b1020b by Yizhi Liu, committed by Tianqi Chen

Generalize pooling to support arbitrary layout (#1103)

* generalize pool2d to arbitrary layout

* explain the layout support for pool in more detail

* allow missing factor size for pooling

* explain what factor size is used for

* fix typo

* rename idx -> axis
parent 154104b3
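
The "arbitrary layout" in the title refers to TVM's layout-string convention: each upper-case letter names a primal axis (N, C, H, W), and a lower-case letter names a sub-axis obtained by splitting the matching primal axis; the number in front of a lower-case letter is the "factor size" the bullets mention, i.e. the split width (NCHW16c packs the channel dimension in blocks of 16). The "allow missing factor size" bullet presumably lets that number be omitted when it is not needed to build the pooling compute. Below is a minimal, illustrative parser for the convention; the function name and regex are mine, not part of the patch:

    import re

    def parse_layout(layout):
        """Split a layout string such as "NCHW" or "NCHW16c" into
        (axis, factor) pairs.  Upper-case letters are primal axes;
        a lower-case letter is a sub-axis whose optional leading
        number is the split factor (0 = factor not given)."""
        return [(name, int(factor) if factor else 0)
                for factor, name in re.findall(r"(\d*)([A-Za-z])", layout)]

    print(parse_layout("NCHW"))     # [('N', 0), ('C', 0), ('H', 0), ('W', 0)]
    print(parse_layout("NCHW16c"))  # ends with ('c', 16): channel split by 16
    print(parse_layout("NCHWc"))    # factor omitted -> ('c', 0)
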
@@ -33,7 +33,9 @@ inline Schedule schedule_pool(const Target &target, const Array<Tensor>& outs) {
   auto s = create_schedule(out_ops);
   auto _schedule = [&](const Tensor& padded_input, const Tensor& pool) {
-    s[padded_input].compute_inline();
+    if (padded_input->op->is_type<ComputeOpNode>()) {
+      s[padded_input].compute_inline();
+    }
     auto num_thread = target->max_num_threads;
     Tensor out;
     Tensor OL;

@@ -84,7 +84,8 @@ def schedule_pool(outs):
     outs = [outs] if isinstance(outs, tvm.tensor.Tensor) else outs
     s = tvm.create_schedule([x.op for x in outs])
     def _schedule(PaddedInput, Pool):
-        s[PaddedInput].compute_inline()
+        if isinstance(PaddedInput.op, tvm.tensor.ComputeOp):
+            s[PaddedInput].compute_inline()
         num_thread = tvm.target.current_target(allow_none=False).max_num_threads
         if Pool.op in s.outputs:
             Out = Pool

@@ -67,7 +67,8 @@ def schedule_pool(outs):
     outs = [outs] if isinstance(outs, tvm.tensor.Tensor) else outs
     s = tvm.create_schedule([x.op for x in outs])
     def _schedule(PaddedInput, Pool):
-        s[PaddedInput].opengl()
+        if isinstance(PaddedInput.op, tvm.tensor.ComputeOp):
+            s[PaddedInput].opengl()
         if Pool.op in s.outputs:
             Out = Pool
         else:
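
All three hunks above add the same guard around the pad stage: when the pooling needs no padding, the tensor handed to _schedule as the padded input can simply be the original input placeholder rather than a separate pad compute, and compute_inline (or opengl) only makes sense for a stage backed by a ComputeOp. A minimal sketch of the pattern, using the old top-level tvm.placeholder/tvm.compute API and made-up stage names:

    import tvm

    data = tvm.placeholder((1, 64, 32, 32), name="data")  # backed by a PlaceholderOp
    # Stand-in for the pad stage that pooling inserts when padding > 0.
    padded = tvm.compute(data.shape, lambda *i: data(*i), name="padded")
    pool = tvm.compute(data.shape, lambda *i: padded(*i), name="pool")
    s = tvm.create_schedule(pool.op)

    def _schedule(PaddedInput, Pool):  # Pool kept only to mirror the signature
        # Inline the pad stage only when it really is a compute stage;
        # a raw placeholder (no padding inserted) must be left alone.
        if isinstance(PaddedInput.op, tvm.tensor.ComputeOp):
            s[PaddedInput].compute_inline()

    _schedule(padded, pool)  # pad stage present: it is inlined into pool
    _schedule(data, pool)    # placeholder input: the guard skips it
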
@@ -27,6 +27,10 @@ def schedule_injective(outs):
         n, c, _, _ = s[x].op.axis
         fused = s[x].fuse(n, c) # for nhwc layout, fuse n and h
         s[x].parallel(fused)
+    elif len(s[x].op.axis) == 5:
+        n, C, h, _, _ = s[x].op.axis
+        fused = s[x].fuse(n, C, h)
+        s[x].parallel(fused)
     else:
         s[x].parallel(s[x].op.axis[0])
     return s
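
The injective schedule gains a branch for 5-D outputs, which is what a split-channel layout such as NCHW16c produces (batch, outer channel, height, width, inner channel); fusing n, C and h keeps the parallel loop long enough. A small sketch of that branch on an illustrative 5-D tensor, again using the old top-level API:

    import tvm

    # A 5-D tensor as an NCHW16c-style layout would produce:
    # (batch, channel_outer, height, width, channel_inner).
    x = tvm.compute((1, 4, 32, 32, 16),
                    lambda n, C, h, w, c: n + C + h + w + c,
                    name="x")
    s = tvm.create_schedule(x.op)

    if len(s[x].op.axis) == 5:
        n, C, h, _, _ = s[x].op.axis
        fused = s[x].fuse(n, C, h)  # 1 * 4 * 32 = 128 parallel iterations
        s[x].parallel(fused)

    print(tvm.lower(s, [x], simple_mode=True))
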