[arrayfire] 30/284: converted transform to async call

Sun Feb 7 18:59:16 UTC 2016

This is an automated email from the git hooks/post-receive script.

ghisvail-guest pushed a commit to branch debian/experimental
in repository arrayfire.

commit 32a65d8f390e2893ba91ef6742365f9fd8e7c3c4
Author: pradeep <pradeep at arrayfire.com>
Date:   Fri Nov 20 16:58:13 2015 -0500

    converted transform to async call
---
 src/backend/cpu/transform.cpp | 230 +++++++++++++++++++++---------------------
 1 file changed, 116 insertions(+), 114 deletions(-)

diff --git a/src/backend/cpu/transform.cpp b/src/backend/cpu/transform.cpp
index 68e8d96..f4a0514 100644
--- a/src/backend/cpu/transform.cpp
+++ b/src/backend/cpu/transform.cpp
@@ -12,136 +12,138 @@
 #include <math.hpp>
 #include <stdexcept>
 #include <err_cpu.hpp>
+#include <platform.hpp>
+#include <async_queue.hpp>
 #include "transform_interp.hpp"
 
 namespace cpu
 {
-    template <typename T>
-    void calc_affine_inverse(T *txo, const T *txi)
-    {
-        T det = txi[0]*txi[4] - txi[1]*txi[3];
-
-        txo[0] = txi[4] / det;
-        txo[1] = txi[3] / det;
-        txo[3] = txi[1] / det;
-        txo[4] = txi[0] / det;
-
-        txo[2] = txi[2] * -txo[0] + txi[5] * -txo[1];
-        txo[5] = txi[2] * -txo[3] + txi[5] * -txo[4];
-    }
 
-    template <typename T>
-    void calc_affine_inverse(T *tmat, const T *tmat_ptr, const bool inverse)
-    {
-        // The way kernel is structured, it expects an inverse
-        // transform matrix by default.
-        // If it is an forward transform, then we need its inverse
-        if(inverse) {
-            for(int i = 0; i < 6; i++)
-                tmat[i] = tmat_ptr[i];
-        } else {
-            calc_affine_inverse(tmat, tmat_ptr);
-        }
+template <typename T>
+void calc_affine_inverse(T *txo, const T *txi)
+{
+    T det = txi[0]*txi[4] - txi[1]*txi[3];
+
+    txo[0] = txi[4] / det;
+    txo[1] = txi[3] / det;
+    txo[3] = txi[1] / det;
+    txo[4] = txi[0] / det;
+
+    txo[2] = txi[2] * -txo[0] + txi[5] * -txo[1];
+    txo[5] = txi[2] * -txo[3] + txi[5] * -txo[4];
+}
+
+template <typename T>
+void calc_affine_inverse(T *tmat, const T *tmat_ptr, const bool inverse)
+{
+    // The way kernel is structured, it expects an inverse
+    // transform matrix by default.
+    // If it is an forward transform, then we need its inverse
+    if(inverse) {
+        for(int i = 0; i < 6; i++)
+            tmat[i] = tmat_ptr[i];
+    } else {
+        calc_affine_inverse(tmat, tmat_ptr);
     }
+}
 
-    template<typename T, af_interp_type method>
-    void transform_(T *out, const T *in, const float *tf,
-                    const af::dim4 &odims, const af::dim4 &idims,
-                    const af::dim4 &ostrides, const af::dim4 &istrides,
-                    const af::dim4 &tstrides, const bool inverse)
-    {
-        dim_t nimages     = idims[2];
-        // Multiplied in src/backend/transform.cpp
-        dim_t ntransforms = odims[2] / idims[2];
-
-        void (*t_fn)(T *, const T *, const float *, const af::dim4 &,
-                     const af::dim4 &, const af::dim4 &,
-                     const dim_t, const dim_t, const dim_t, const dim_t);
-
-        switch(method) {
-            case AF_INTERP_NEAREST:
-                t_fn = &transform_n;
-                break;
-            case AF_INTERP_BILINEAR:
-                t_fn = &transform_b;
-                break;
-            case AF_INTERP_LOWER:
-                t_fn = &transform_l;
-                break;
-            default:
-                AF_ERROR("Unsupported interpolation type", AF_ERR_ARG);
-                break;
-        }
+template<typename T, af_interp_type method>
+void transform_(Array<T> output, const Array<T> input,
+                const Array<float> transform, const bool inverse)
+{
+    const af::dim4 idims    = input.dims();
+    const af::dim4 odims    = output.dims();
+    const af::dim4 istrides = input.strides();
+    const af::dim4 ostrides = output.strides();
+
+    T * out = output.get();
+    const T * in = input.get();
+    const float* tf = transform.get();
+
+    dim_t nimages     = idims[2];
+    // Multiplied in src/backend/transform.cpp
+    dim_t ntransforms = odims[2] / idims[2];
+
+    void (*t_fn)(T *, const T *, const float *, const af::dim4 &,
+                 const af::dim4 &, const af::dim4 &,
+                 const dim_t, const dim_t, const dim_t, const dim_t);
+
+    switch(method) {
+        case AF_INTERP_NEAREST:
+            t_fn = &transform_n;
+            break;
+        case AF_INTERP_BILINEAR:
+            t_fn = &transform_b;
+            break;
+        case AF_INTERP_LOWER:
+            t_fn = &transform_l;
+            break;
+        default:
+            AF_ERROR("Unsupported interpolation type", AF_ERR_ARG);
+            break;
+    }
 
 
-        // For each transform channel
-        for(int t_idx = 0; t_idx < (int)ntransforms; t_idx++) {
-            // Compute inverse if required
-            const float *tmat_ptr = tf + t_idx * 6;
-            float tmat[6];
-            calc_affine_inverse(tmat, tmat_ptr, inverse);
+    // For each transform channel
+    for(int t_idx = 0; t_idx < (int)ntransforms; t_idx++) {
+        // Compute inverse if required
+        const float *tmat_ptr = tf + t_idx * 6;
+        float tmat[6];
+        calc_affine_inverse(tmat, tmat_ptr, inverse);
 
-            // Offset for output pointer
-            dim_t o_offset = t_idx * nimages * ostrides[2];
+        // Offset for output pointer
+        dim_t o_offset = t_idx * nimages * ostrides[2];
 
-            // Do transform for image
-            for(int yy = 0; yy < (int)odims[1]; yy++) {
-                for(int xx = 0; xx < (int)odims[0]; xx++) {
-                    t_fn(out, in, tmat, idims, ostrides, istrides, nimages, o_offset, xx, yy);
-                }
+        // Do transform for image
+        for(int yy = 0; yy < (int)odims[1]; yy++) {
+            for(int xx = 0; xx < (int)odims[0]; xx++) {
+                t_fn(out, in, tmat, idims, ostrides, istrides, nimages, o_offset, xx, yy);
             }
         }
     }
+}
 
-    template<typename T>
-    Array<T> transform(const Array<T> &in, const Array<float> &transform, const af::dim4 &odims,
-                        const af_interp_type method, const bool inverse)
-    {
-        const af::dim4 idims = in.dims();
-
-        Array<T> out = createEmptyArray<T>(odims);
-
-        switch(method) {
-            case AF_INTERP_NEAREST:
-                transform_<T, AF_INTERP_NEAREST>
-                          (out.get(), in.get(), transform.get(), odims, idims,
-                           out.strides(), in.strides(), transform.strides(), inverse);
-                break;
-            case AF_INTERP_BILINEAR:
-                transform_<T, AF_INTERP_BILINEAR>
-                          (out.get(), in.get(), transform.get(), odims, idims,
-                           out.strides(), in.strides(), transform.strides(), inverse);
-                break;
-            case AF_INTERP_LOWER:
-                transform_<T, AF_INTERP_LOWER>
-                          (out.get(), in.get(), transform.get(), odims, idims,
-                           out.strides(), in.strides(), transform.strides(), inverse);
-                break;
-            default:
-                AF_ERROR("Unsupported interpolation type", AF_ERR_ARG);
-                break;
-        }
-
-        return out;
+template<typename T>
+Array<T> transform(const Array<T> &in, const Array<float> &transform, const af::dim4 &odims,
+                    const af_interp_type method, const bool inverse)
+{
+    Array<T> out = createEmptyArray<T>(odims);
+    in.eval();
+
+    switch(method) {
+        case AF_INTERP_NEAREST :
+            getQueue().enqueue(transform_<T, AF_INTERP_NEAREST >, out, in, transform, inverse);
+            break;
+        case AF_INTERP_BILINEAR:
+            getQueue().enqueue(transform_<T, AF_INTERP_BILINEAR>, out, in, transform, inverse);
+            break;
+        case AF_INTERP_LOWER   :
+            getQueue().enqueue(transform_<T, AF_INTERP_LOWER   >, out, in, transform, inverse);
+            break;
+        default: AF_ERROR("Unsupported interpolation type", AF_ERR_ARG); break;
     }
 
+    return out;
+}
+
+
+#define INSTANTIATE(T)                                                              \
+template Array<T> transform(const Array<T> &in, const Array<float> &transform,      \
+                            const af::dim4 &odims, const af_interp_type method,     \
+                            const bool inverse);
+
+
+INSTANTIATE(float)
+INSTANTIATE(double)
+INSTANTIATE(cfloat)
+INSTANTIATE(cdouble)
+INSTANTIATE(int)
+INSTANTIATE(uint)
+INSTANTIATE(intl)
+INSTANTIATE(uintl)
+INSTANTIATE(uchar)
+INSTANTIATE(char)
+INSTANTIATE(short)
+INSTANTIATE(ushort)
 
-#define INSTANTIATE(T)                                                                  \
-    template Array<T> transform(const Array<T> &in, const Array<float> &transform,      \
-                                const af::dim4 &odims, const af_interp_type method,     \
-                                const bool inverse);
-
-
-    INSTANTIATE(float)
-    INSTANTIATE(double)
-    INSTANTIATE(cfloat)
-    INSTANTIATE(cdouble)
-    INSTANTIATE(int)
-    INSTANTIATE(uint)
-    INSTANTIATE(intl)
-    INSTANTIATE(uintl)
-    INSTANTIATE(uchar)
-    INSTANTIATE(char)
-    INSTANTIATE(short)
-    INSTANTIATE(ushort)
 }

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/arrayfire.git