summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorrander <rander.wang@intel.com>2017-03-31 11:07:02 +0800
committerYang Rong <rong.r.yang@intel.com>2017-04-17 16:08:49 +0800
commit06ed1ee4e238912a1b8f8c2e87c92875efa40c07 (patch)
treee2a613984170b5f46f0df3b892c6c5d4c71ee039
parent573153abb2cd0a25215ca68b1816eee5e13fb440 (diff)
backend: add double version of pown
Implement the double version of pown by converting it to a pow call; this passes the cft. There are also some optimizations that can be done later. Signed-off-by: rander <rander.wang@intel.com> Tested-by: Yang Rong <rong.r.yang@intel.com>
-rw-r--r--backend/src/libocl/tmpl/ocl_math_common.tmpl.cl18
-rw-r--r--backend/src/libocl/tmpl/ocl_math_common.tmpl.h1
2 files changed, 19 insertions, 0 deletions
diff --git a/backend/src/libocl/tmpl/ocl_math_common.tmpl.cl b/backend/src/libocl/tmpl/ocl_math_common.tmpl.cl
index dc6306c6..d55b972d 100644
--- a/backend/src/libocl/tmpl/ocl_math_common.tmpl.cl
+++ b/backend/src/libocl/tmpl/ocl_math_common.tmpl.cl
@@ -2348,6 +2348,24 @@ OVERLOADABLE double pow(double x, double y)
return __ocl_internal_pow(x, y);
}
+OVERLOADABLE double pown(double x, int n)
+{
+ /* x raised to the integer power n: n == 0 and NaN x are handled here, everything else is delegated to __ocl_internal_pow(x, n). */
+ int hx, ix;
+ unsigned lx;
+ /* __HI/__LO presumably yield the upper/lower 32-bit words of x (fdlibm convention) -- TODO confirm against their definitions */
+ hx = __HI(x); lx = __LO(x);
+ ix = hx&0x7fffffff; /* upper word with the top (sign) bit masked off */
+
+ /* n == 0: x**0 = 1; tested before the NaN check, so a NaN x also gives 1.0 */
+ if(n == 0) return 1.0;
+
+ /* x is +-NaN: return x+n so the NaN propagates */
+ if(ix > 0x7ff00000 || ((ix==0x7ff00000)&&(lx!=0)))
+ return x+n;
+
+ return __ocl_internal_pow(x, n);
+}
+
OVERLOADABLE double remainder(double x, double p)
{
int hx,hp;
diff --git a/backend/src/libocl/tmpl/ocl_math_common.tmpl.h b/backend/src/libocl/tmpl/ocl_math_common.tmpl.h
index 9a75d00a..f5fa2897 100644
--- a/backend/src/libocl/tmpl/ocl_math_common.tmpl.h
+++ b/backend/src/libocl/tmpl/ocl_math_common.tmpl.h
@@ -58,6 +58,7 @@ OVERLOADABLE double mad(double a, double b, double c);
OVERLOADABLE double nan(ulong code);
OVERLOADABLE double nextafter(double x, double y);
OVERLOADABLE double pow(double x, double y);
+OVERLOADABLE double pown(double x, int n);
OVERLOADABLE double remainder(double x, double p);
OVERLOADABLE double rint(double x);
OVERLOADABLE double round(double x);