add the reciprocal function

6df1ecc9 · xuchen · e193b1c2 · 6df1ecc9 · 6df1ecc9 · 6df1ecc9
Commit 6df1ecc9 authored Mar 25, 2020 by xuchen
--- a/source/tensor/core/math/Unary.cpp
+++ b/source/tensor/core/math/Unary.cpp
@@ -68,6 +68,14 @@ T UnaryIsZero(T r)
    return (r == 0.0) ? (T)1.0 : (T)0.0;
 }
+template<class T>
+T UnaryReciprocal(T r) /* reciprocal of a single value: returns 1 / r cast back to T */
+{
+    if (r == 0) /* a zero input is reported through ShowNTErrors (macro defined outside this view) */
+        ShowNTErrors("Zero does not have reciprocal value.");
+    return (T)(1 / r); /* the literal 1 is an int, so for an integral T this is integer division */
+}
 /* define three macros separately, specifying the respective function names */
 #ifdef USE_CUDA
 #define _SIMPLE_UNARY_FUNCTION(_funcName, _cudaFuncName, origFunc)                   \
@@ -186,6 +194,7 @@ _SIMPLE_UNARY_FUNCTION(_Square, _CudaSquare, UnarySquare)
 _SIMPLE_UNARY_FUNCTION(_Sin, _CudaSin, sin)
 _SIMPLE_UNARY_FUNCTION(_Cos, _CudaCos, cos)
 _SIMPLE_UNARY_FUNCTION(_Tan, _CudaTan, tan)
+_SIMPLE_UNARY_FUNCTION(_Reciprocal, _CudaReciprocal, UnaryReciprocal)
 #else
 _SIMPLE_UNARY_FUNCTION(_Absolute, fabs)
 _SIMPLE_UNARY_FUNCTION(_Ceil, ceil)
@@ -202,6 +211,7 @@ _SIMPLE_UNARY_FUNCTION(_Square, UnarySquare)
 _SIMPLE_UNARY_FUNCTION(_Sin, sin)
 _SIMPLE_UNARY_FUNCTION(_Cos, cos)
 _SIMPLE_UNARY_FUNCTION(_Tan, tan)
+_SIMPLE_UNARY_FUNCTION(_Reciprocal, UnaryReciprocal)
 #endif
 _SIMPLE_UNARY_FUNCTION_ME(_AbsoluteMe, _Absolute)
@@ -279,4 +289,9 @@ SIMPLE_UNARY_FUNCTION_ME(TanMe, _Tan)
 SIMPLE_UNARY_FUNCTION(Tan, _Tan, MATH_TAN)
 SIMPLE_UNARY_FUNCTION_VOID(Tan, _Tan, MATH_TAN)
+_SIMPLE_UNARY_FUNCTION_ME(_ReciprocalMe, _Reciprocal)
+SIMPLE_UNARY_FUNCTION_ME(ReciprocalMe, _Reciprocal)
+SIMPLE_UNARY_FUNCTION(Reciprocal, _Reciprocal, MATH_RECIPROCAL)
+SIMPLE_UNARY_FUNCTION_VOID(Reciprocal, _Reciprocal, MATH_RECIPROCAL)
 } // namespace nts(NiuTrans.Tensor)
\ No newline at end of file
--- a/source/tensor/core/math/Unary.cu
+++ b/source/tensor/core/math/Unary.cu
@@ -142,6 +142,15 @@ T UnaryCudaTan(T x)
    return (T)tan((float)x);
 }
+template<class T>
+__device__
+T UnaryCudaReciprocal(T x) // device-side reciprocal of a single value: returns 1 / x cast back to T
+{
+    // NOTE(review): the zero check is disabled on the device (was: if (x == 0)
+    //     ShowNTErrors("Zero does not have reciprocal value.");) - a zero input is not reported here
+    return (T)(1 / x);
+}
 #define SIMPLE_UNARY_FUNCTION_GPU(funcName, origFunc)                       \
 template<class T>                                                           \
@@ -155,7 +164,7 @@ void Kernel##funcName(T * a, T * b, int size)                               \
 }                                                                           \
 void _Cuda##funcName(const XTensor * a, XTensor * b)                        \
 {                                                                           \
-    CheckNTErrors((_IsSameShaped(a, b)),                            \
+    CheckNTErrors((_IsSameShaped(a, b)),                                    \
                  "Input tensors should have the same type!");              \
    CheckNTErrors(a->isSparse == false, "TODO!");                           \
                                                                            \
@@ -208,6 +217,8 @@ SIMPLE_UNARY_FUNCTION_GPU(Sin, UnaryCudaSin)
 SIMPLE_UNARY_FUNCTION_GPU(Cos, UnaryCudaCos)
 SIMPLE_UNARY_FUNCTION_GPU(Tan, UnaryCudaTan)
+SIMPLE_UNARY_FUNCTION_GPU(Reciprocal, UnaryCudaReciprocal)
 #endif // USE_CUDA
 } // namespace nts(NiuTrans.Tensor)
\ No newline at end of file
--- a/source/tensor/core/math/Unary.cuh
+++ b/source/tensor/core/math/Unary.cuh
@@ -75,6 +75,9 @@ void _CudaCos(const XTensor * a, XTensor * b);
 /* set each entry to its tangent value */
 void _CudaTan(const XTensor * a, XTensor * b);
+/* set each entry to its reciprocal value (CUDA version);
+the definition generated by SIMPLE_UNARY_FUNCTION_GPU checks that
+a and b are same-shaped and that a is not sparse */
+void _CudaReciprocal(const XTensor * a, XTensor * b);
 #endif // USE_CUDA
 } // namespace nts(NiuTrans.Tensor)

--- a/source/tensor/core/math/Unary.h
+++ b/source/tensor/core/math/Unary.h
@@ -236,6 +236,20 @@ XTensor Tan(const XTensor & a);
 /* set every entry to its tangent value */
 void Tan(const XTensor & a, XTensor & b);
+/* set every entry to its reciprocal value
+(pointer version: a is const; b is presumably the output tensor - confirm) */
+void _Reciprocal(const XTensor * a, XTensor * b);
+/* set every entry to its reciprocal value (do it in place)
+keep the result in the input tensor a and return nothing */
+void _ReciprocalMe(XTensor * a);
+/* set every entry to its reciprocal value (do it in place)
+keep the result in the input tensor a and return nothing */
+void ReciprocalMe(XTensor & a);
+/* set every entry to its reciprocal value (return an XTensor structure)
+make a new tensor to keep the result and return it */
+XTensor Reciprocal(const XTensor & a);
+/* set every entry to its reciprocal value
+(reference version: a is const; b is presumably the output tensor - confirm) */
+void Reciprocal(const XTensor & a, XTensor & b);
 } // namespace nts(NiuTrans.Tensor)
 #endif // end __UNARY_H__
\ No newline at end of file