Commit 0a6c36ce by Tianqi Chen, committed by GitHub

[INTRIN] Enable pow (#471)

* [INTRIN] Enable pow

* rename pow->power

* fix
parent 87b95e2e
@@ -206,6 +206,25 @@ def sqrt(x):
     return call_pure_intrin(x.dtype, "sqrt", x)
 
 
+def power(x, y):
+    """x power y
+
+    Parameters
+    ----------
+    x : Expr
+        Input argument.
+
+    y : Expr
+        The exponent.
+
+    Returns
+    -------
+    z : Expr
+        The result.
+    """
+    return call_pure_intrin(x.dtype, "pow", x, y)
+
+
 # Intrinsic rule related code
 def register_intrin_rule(target, intrin, f=None, override=False):
     """Register an intrinsic function generation rule.
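For orientation, a minimal usage sketch of the new intrinsic, assuming the 0.x-era tvm Python API that also appears in the test change below (variable names are illustrative, not part of the commit):

import tvm

n = tvm.var('n')
A = tvm.placeholder((n,), name='A')
# tvm.power(x, y) builds the pure "pow" intrinsic call; the per-target
# rules registered below decide how each backend lowers it.
B = tvm.compute(A.shape, lambda *i: tvm.power(A(*i), 2.0), name='B')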
@@ -21,6 +21,9 @@ TVM_REGISTER_GLOBAL("tvm.intrin.rule.default.tanh")
 TVM_REGISTER_GLOBAL("tvm.intrin.rule.default.sqrt")
 .set_body(DispatchExtern<FloatSuffix>);
 
+TVM_REGISTER_GLOBAL("tvm.intrin.rule.default.pow")
+.set_body(DispatchExtern<FloatSuffix>);
+
 } // namespace intrin
 } // namespace codegen
 } // namespace tvm
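FloatSuffix dispatches to the C math library by float width, so "pow" lowers to powf for float32 and pow for float64. A rule can also be registered or overridden from Python through the register_intrin_rule API shown above; a hedged sketch (my_pow_rule is an illustrative name):

def my_pow_rule(op):
    # op is the Call node of the "pow" intrinsic; redirect it to an
    # extern function of our choosing, here the single-precision powf.
    return tvm.call_pure_extern(op.dtype, "powf", op.args[0], op.args[1])

tvm.register_intrin_rule("opencl", "pow", my_pow_rule, override=True)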
@@ -48,6 +48,9 @@ TVM_REGISTER_GLOBAL("tvm.intrin.rule.cuda.tanh")
 TVM_REGISTER_GLOBAL("tvm.intrin.rule.cuda.sqrt")
 .set_body(DispatchExtern<CUDAMath>);
 
+TVM_REGISTER_GLOBAL("tvm.intrin.rule.cuda.pow")
+.set_body(DispatchExtern<CUDAMath>);
+
 } // namespace intrin
 } // namespace codegen
 } // namespace tvm
@@ -21,6 +21,9 @@ TVM_REGISTER_GLOBAL("tvm.intrin.rule.opencl.tanh")
 TVM_REGISTER_GLOBAL("tvm.intrin.rule.opencl.sqrt")
 .set_body(DispatchExtern<FloatDirect>);
 
+TVM_REGISTER_GLOBAL("tvm.intrin.rule.opencl.pow")
+.set_body(DispatchExtern<FloatDirect>);
+
 } // namespace intrin
 } // namespace codegen
 } // namespace tvm
@@ -76,6 +76,9 @@ TVM_REGISTER_GLOBAL("tvm.intrin.rule.llvm.log")
 TVM_REGISTER_GLOBAL("tvm.intrin.rule.llvm.sqrt")
 .set_body(DispatchLLVMPureIntrin<::llvm::Intrinsic::sqrt>);
 
+TVM_REGISTER_GLOBAL("tvm.intrin.rule.llvm.pow")
+.set_body(DispatchLLVMPureIntrin<::llvm::Intrinsic::pow>);
+
 } // namespace llvm
 } // namespace codegen
 } // namespace tvm
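On the LLVM backend the rule maps the intrinsic directly onto ::llvm::Intrinsic::pow instead of an extern call. One way to confirm the rule fires, sketched against the same-era build API (fpow is an illustrative name, reusing A, B from the sketch above):

s = tvm.create_schedule(B.op)
fpow = tvm.build(s, [A, B], "llvm", name="fpow")
# The emitted module should reference the llvm.pow intrinsic
# rather than calling out to an external pow().
print(fpow.get_source())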
@@ -36,11 +36,11 @@ def test_exp():
     check_device("opencl")
 
 
-def test_log_llvm():
+def test_log_pow_llvm():
     # graph
     n = tvm.var('n')
     A = tvm.placeholder((n,), name='A')
-    B = tvm.compute(A.shape, lambda *i: tvm.log(A(*i)), name='B')
+    B = tvm.compute(A.shape, lambda *i: tvm.power(tvm.log(A(*i)), 2.0), name='B')
     s = tvm.create_schedule(B.op)
     # create iter var and assign them tags.
     bx, tx = s[B].split(B.op.axis[0], factor=32)
@@ -57,7 +57,7 @@ def test_log_llvm():
         b = tvm.nd.array(np.zeros(n, dtype=B.dtype), ctx)
         flog(a, b)
         np.testing.assert_allclose(
-            b.asnumpy(), np.log(a.asnumpy()), rtol=1e-5)
+            b.asnumpy(), np.power(np.log(a.asnumpy()), 2.0), rtol=1e-5)
 
 
 def test_add():
@@ -106,6 +106,6 @@ def test_add():
 
 
 if __name__ == "__main__":
-    test_log_llvm()
+    test_log_pow_llvm()
     test_exp()
     test_add()