Oneflow-Inc · oneflow-ci-bot · Jan 11, 2021 · Jan 6, 2021 · Jan 6, 2021 · Jan 6, 2021
diff --git a/oneflow/python/ops/math_binary_elementwise_ops.py b/oneflow/python/ops/math_binary_elementwise_ops.py
@@ -16,7 +16,7 @@
 from __future__ import absolute_import
 
 import os
-from typing import Optional
+from typing import Optional, Union
 
 import oneflow as flow
 import oneflow.python.framework.id_util as id_util
@@ -89,7 +89,9 @@ def atan2Job(x: tp.Numpy.Placeholder((3,),), y: tp.Numpy.Placeholder((3, ))
 
 @oneflow_export("math.pow")
 def pow(
-    x: oneflow_api.BlobDesc, y: oneflow_api.BlobDesc, name: Optional[str] = None
+    x: oneflow_api.BlobDesc,
+    y: Union[oneflow_api.BlobDesc, float],
+    name: Optional[str] = None,
 ) -> oneflow_api.BlobDesc:
     """This operator computes the Pow result. 
 
@@ -101,14 +103,16 @@ def pow(
 
     Args:
         x (oneflow_api.BlobDesc): A Blob
-        y (oneflow_api.BlobDesc): A Blob, the exponential factor of Pow
+        y (Union[oneflow_api.BlobDesc, float]): A Blob or float value, the exponential factor of Pow
         name (Optional[str], optional): The name for the operation. Defaults to None.
 
     Returns:
         oneflow_api.BlobDesc: The result Blob
 
     For example: 
 
+    Example 1: 
+
     .. code-block:: python
 
         import oneflow as flow
@@ -127,8 +131,44 @@ def powJob(x: tp.Numpy.Placeholder((3,), ), y: tp.Numpy.Placeholder((3,))
         out = powJob(x, y)
 
         # out [  4.  27. 256.]
+
+    Example 2: 
+
+    .. code-block:: python 
+
+        import oneflow as flow 
+        import oneflow.typing as tp 
+        import numpy as np 
+
+
+        @flow.global_function()
+        def scalar_pow_job(x: tp.Numpy.Placeholder(shape=(3, )))->tp.Numpy: 
+            with flow.scope.placement("cpu", "0:0"): 
+                out = flow.math.pow(x, 2.0)
+            return out 
+
+
+        x = np.array([1, 2, 3]).astype(np.float32)
+        out = scalar_pow_job(x)
+
+        # out [1. 4. 9.]
     """
-    return build_math_binary_elementwise_op("pow", x, y, name)
+    if name is None:
+        name = id_util.UniqueStr("Pow_")
+
+    if isinstance(y, (int, float)):
+        return (
+            flow.user_op_builder(name)
+            .Op("scalar_pow")
+            .Input("in", [x])
+            .Attr("exponent", float(y))
+            .Output("out")
+            .Build()
+            .InferAndTryRun()
+            .RemoteBlobList()[0]
+        )
+    else:
+        return build_math_binary_elementwise_op("pow", x, y, name)
 
 
 @oneflow_export("math.floordiv")

diff --git a/oneflow/python/test/ops/test_scalar_pow.py b/oneflow/python/test/ops/test_scalar_pow.py
@@ -0,0 +1,151 @@
+"""
+Copyright 2020 The OneFlow Authors. All rights reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+import oneflow as flow
+import numpy as np
+import oneflow.typing as tp
+from test_util import GenArgList
+import unittest
+from collections import OrderedDict
+from typing import Dict
+import os
+import random
+
+
+def _compare_scalar_pow_with_np(
+    input_shape, exponent, device_type, value_type, machine_ids, device_counts
+):
+    input_1 = np.random.uniform(0, 1, size=input_shape).astype(value_type[0])
+
+    assert device_type in ["cpu", "gpu"]
+
+    flow.clear_default_session()
+    if device_type == "cpu":
+        flow.config.cpu_device_num(device_counts)
+    else:
+        flow.config.gpu_device_num(device_counts)
+
+    func_config = flow.FunctionConfig()
+    func_config.default_placement_scope(flow.scope.placement(device_type, machine_ids))
+
+    func_config.default_data_type(value_type[1])
+
+    def np_pow(input, exponent):
+        out = np.power(input, exponent)
+        return np.array(out).astype(value_type[0])
+
+    np_out_pow = np_pow(input_1, exponent)
+
+    def np_diff(input, exponent):
+        diff = exponent * np.power(input, exponent - 1)
+        return diff
+
+    _np_grad = np_diff(input_1, exponent)
+
+    def assert_prediction_grad(blob: tp.Numpy):
+        assert np.allclose(blob, _np_grad, atol=1e-5)
+
+    @flow.global_function(
+        type="train", function_config=func_config,
+    )
+    def oneflow_pow(
+        of_input_1: tp.Numpy.Placeholder(shape=input_1.shape, dtype=value_type[1]),
+    ) -> tp.Numpy:
+        with flow.scope.placement(device_type, "0:0"):
+            v = flow.get_variable(
+                shape=input_1.shape,
+                dtype=value_type[1],
+                initializer=flow.zeros_initializer(),
+                name="x_var",
+            )
+            x_var = of_input_1 + v
+
+        flow.watch_diff(x_var, assert_prediction_grad)
+
+        of_pow_out = flow.math.pow(x_var, exponent)
+
+        with flow.scope.placement(device_type, "0:0"):
+            flow.optimizer.SGD(
+                flow.optimizer.PiecewiseConstantScheduler([], [1e-3]), momentum=0
+            ).minimize(of_pow_out)
+
+        return of_pow_out
+
+    of_out_pow = oneflow_pow(input_1)
+
+    assert np.allclose(of_out_pow, np_out_pow, atol=1e-5)
+
+
+def _gen_arg_dict(shape, exponent, device_type, value_type, machine_ids, device_counts):
+    # Generate a dict to pass parameter to test case
+    arg_dict = OrderedDict()
+    arg_dict["input_shape"] = [shape]
+    arg_dict["exponent"] = [exponent]
+    arg_dict["device_type"] = [device_type]
+    arg_dict["value_type"] = [
+        (np.float32, flow.float32),
+        (np.float64, flow.float64),
+    ]
+    arg_dict["machine_ids"] = [machine_ids]
+    arg_dict["device_counts"] = [device_counts]
+    return arg_dict
+
+
+@flow.unittest.skip_unless_1n1d()
+class TestScalarPow1n1d(flow.unittest.TestCase):
+    def test_scalar_pow_cpu(test_case):
+        arg_dict = _gen_arg_dict(
+            shape=(3, 3),
+            exponent=1.4,
+            device_type="cpu",
+            value_type="float",
+            machine_ids="0:0",
+            device_counts=1,
+        )
+        for arg in GenArgList(arg_dict):
+            _compare_scalar_pow_with_np(*arg)
+
+    @unittest.skipIf(os.getenv("ONEFLOW_TEST_CPU_ONLY"), "only test cpu cases")
+    def test_scalar_pow_gpu(test_case):
+        arg_dict = _gen_arg_dict(
+            shape=(4, 4),
+            exponent=2.3,
+            device_type="gpu",
+            value_type="float",
+            machine_ids="0:0",
+            device_counts=1,
+        )
+        for arg in GenArgList(arg_dict):
+            _compare_scalar_pow_with_np(*arg)
+
+
+@flow.unittest.skip_unless_1n2d()
+class TestScalarPow1n2d(flow.unittest.TestCase):
+    @unittest.skipIf(os.getenv("ONEFLOW_TEST_CPU_ONLY"), "only test cpu cases")
+    def test_pow_gpu_1n2d(test_case):
+        arg_dict = _gen_arg_dict(
+            shape=(4, 8, 4),
+            exponent=2.0,
+            device_type="gpu",
+            value_type="float",
+            machine_ids="0:0-1",
+            device_counts=2,
+        )
+        for arg in GenArgList(arg_dict):
+            _compare_scalar_pow_with_np(*arg)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/oneflow/user/kernels/scalar_pow_kernel.cpp b/oneflow/user/kernels/scalar_pow_kernel.cpp
@@ -0,0 +1,87 @@
+/*
+Copyright 2020 The OneFlow Authors. All rights reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+#include "oneflow/core/framework/framework.h"
+#include "oneflow/core/common/data_type.h"
+
+namespace oneflow {
+
+namespace user_op {
+
+template<DeviceType device_type, typename T>
+class CpuScalarPowKernel final : public OpKernel {
+ public:
+  CpuScalarPowKernel() = default;
+  ~CpuScalarPowKernel() = default;
+
+ private:
+  void Compute(KernelComputeContext* ctx) const override {
+    const Tensor* in_tensor = ctx->Tensor4ArgNameAndIndex("in", 0);
+    Tensor* out_tensor = ctx->Tensor4ArgNameAndIndex("out", 0);
+    const T* in_ptr = in_tensor->dptr<T>();
+    T* out_ptr = out_tensor->mut_dptr<T>();
+    const T exponent = static_cast<T>(ctx->Attr<double>("exponent"));
+
+    const int64_t elem_cnt = in_tensor->shape().elem_cnt();
+    FOR_RANGE(int64_t, i, 0, elem_cnt) { out_ptr[i] = std::pow(in_ptr[i], exponent); }
+  }
+  bool AlwaysComputeWhenAllOutputsEmpty() const override { return false; }
+};
+
+#define REGISTER_CPU_SCALAR_POW_KERNEL(device, dtype)   \
+  REGISTER_USER_KERNEL("scalar_pow")                    \
+      .SetCreateFn<CpuScalarPowKernel<device, dtype>>() \
+      .SetIsMatchedHob((HobDeviceTag() == device)       \
+                       & (HobDataType("out", 0) == GetDataType<dtype>::value));
+
+REGISTER_CPU_SCALAR_POW_KERNEL(DeviceType::kCPU, float);
+REGISTER_CPU_SCALAR_POW_KERNEL(DeviceType::kCPU, double);
+
+template<DeviceType device_type, typename T>
+class CpuScalarPowGradKernel final : public OpKernel {
+ public:
+  CpuScalarPowGradKernel() = default;
+  ~CpuScalarPowGradKernel() = default;
+
+ private:
+  void Compute(KernelComputeContext* ctx) const override {
+    const Tensor* x_tensor = ctx->Tensor4ArgNameAndIndex("x", 0);
+    const Tensor* dy_tensor = ctx->Tensor4ArgNameAndIndex("dy", 0);
+    Tensor* dx_tensor = ctx->Tensor4ArgNameAndIndex("dx", 0);
+    const T* x_ptr = x_tensor->dptr<T>();
+    const T* dy_ptr = dy_tensor->dptr<T>();
+    T* dx_ptr = dx_tensor->mut_dptr<T>();
+    const T exponent = static_cast<T>(ctx->Attr<double>("exponent"));
+
+    const int32_t elem_cnt = x_tensor->shape().elem_cnt();
+    FOR_RANGE(int32_t, i, 0, elem_cnt) {
+      dx_ptr[i] = exponent * (std::pow(x_ptr[i], exponent - static_cast<T>(1))) * dy_ptr[i];
+    }
+  }
+  bool AlwaysComputeWhenAllOutputsEmpty() const override { return false; }
+};
+
+#define REGISTER_CPU_SCALAR_POW_GRAD_KERNEL(device, dtype)  \
+  REGISTER_USER_KERNEL("scalar_pow_grad")                   \
+      .SetCreateFn<CpuScalarPowGradKernel<device, dtype>>() \
+      .SetIsMatchedHob((HobDeviceTag() == device)           \
+                       & (HobDataType("dx", 0) == GetDataType<dtype>::value));
+
+REGISTER_CPU_SCALAR_POW_GRAD_KERNEL(DeviceType::kCPU, float);
+REGISTER_CPU_SCALAR_POW_GRAD_KERNEL(DeviceType::kCPU, double);
+
+}  // namespace user_op
+
+}  // namespace oneflow