[clfft] 36/74: making the twiddles work in FFT kernels, twiddle in transpose is broken
Ghislain Vaillant
ghisvail-guest at moszumanska.debian.org
Thu Jan 14 19:52:15 UTC 2016
This is an automated email from the git hooks/post-receive script.
ghisvail-guest pushed a commit to branch debian/sid in repository clfft.
commit 755948af793305a555169d854972ae5c0d06fe54
Author: bragadeesh <bragadeesh.natarajan at amd>
Date: Mon Dec 7 18:12:24 2015 -0800
making the twiddles work in FFT kernels, twiddle in transpose is broken
---
src/library/plan.cpp | 11 ++++++++++-
1 file changed, 10 insertions(+), 1 deletion(-)
diff --git a/src/library/plan.cpp b/src/library/plan.cpp
index 1519ea0..c018e78 100644
--- a/src/library/plan.cpp
+++ b/src/library/plan.cpp
@@ -774,7 +774,10 @@ clfftStatus clfftBakePlan( clfftPlanHandle plHandle, cl_uint numQueues, cl_comma
trans2Plan->iDist = fftPlan->oDist;
trans2Plan->oDist = clLengths[1] * trans2Plan->outStride[1];
trans2Plan->gen = transGen;
- trans2Plan->large1D = fftPlan->length[0];
+
+ if(transGen != Transpose_NONSQUARE)
+ trans2Plan->large1D = fftPlan->length[0];
+
trans2Plan->transflag = true;
for (size_t index = 1; index < fftPlan->length.size(); index++)
@@ -828,6 +831,12 @@ clfftStatus clfftBakePlan( clfftPlanHandle plHandle, cl_uint numQueues, cl_comma
row2Plan->oDist *= fftPlan->length[index];
}
+ if (transGen == Transpose_NONSQUARE)
+ {
+ row2Plan->large1D = fftPlan->length[0];
+ row2Plan->twiddleFront = true;
+ }
+
OPENCL_V(clfftBakePlan(fftPlan->planY, numQueues, commQueueFFT, NULL, NULL ),
_T( "BakePlan large1d second row plan failed" ) );
--
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/clfft.git
More information about the debian-science-commits mailing list