[clfft] 35/128: fixing INPLACE addition framework code, gen work to follow next

Ghislain Vaillant ghisvail-guest at moszumanska.debian.org
Thu Oct 22 14:54:35 UTC 2015


This is an automated email from the git hooks/post-receive script.

ghisvail-guest pushed a commit to branch master
in repository clfft.

commit 15be25dd11f5045ff403ec4fe05b9db7fea53631
Author: bragadeesh <bragadeesh.natarajan at amd>
Date:   Fri Aug 21 11:52:33 2015 -0500

    fixing INPLACE addition framework code, gen work to follow next
---
 src/library/plan.cpp | 15 +++++++++------
 1 file changed, 9 insertions(+), 6 deletions(-)

diff --git a/src/library/plan.cpp b/src/library/plan.cpp
index 084cf72..390049d 100644
--- a/src/library/plan.cpp
+++ b/src/library/plan.cpp
@@ -648,7 +648,7 @@ clfftStatus	clfftBakePlan( clfftPlanHandle plHandle, cl_uint numQueues, cl_comma
 					trans1Plan->outStride[1]  = clLengths[1] + padding;
 					trans1Plan->iDist         = fftPlan->iDist;
 					trans1Plan->oDist         = clLengths[0] * trans1Plan->outStride[1];
-					trans1Plan->gen           = Transpose_GCN;
+					trans1Plan->gen           = Transpose_INPLACE;
 					trans1Plan->transflag     = true;
 
 					OPENCL_V(clfftBakePlan(fftPlan->planTX, numQueues, commQueueFFT, NULL, NULL ),
@@ -714,7 +714,7 @@ clfftStatus	clfftBakePlan( clfftPlanHandle plHandle, cl_uint numQueues, cl_comma
 					trans2Plan->outStride[1]  = clLengths[0] + padding;
 					trans2Plan->iDist         = fftPlan->oDist;
 					trans2Plan->oDist         = clLengths[1] * trans2Plan->outStride[1];
-                    trans2Plan->gen           = Transpose_GCN;
+                    trans2Plan->gen           = Transpose_INPLACE;
 					trans2Plan->large1D			= fftPlan->length[0];
 					trans2Plan->transflag     = true;
 
@@ -778,7 +778,7 @@ clfftStatus	clfftBakePlan( clfftPlanHandle plHandle, cl_uint numQueues, cl_comma
 					trans3Plan->outStride[1]  = clLengths[1];
 					trans3Plan->iDist         = clLengths[1] * trans3Plan->inStride[1];
 					trans3Plan->oDist         = fftPlan->oDist;
-                    trans3Plan->gen           = Transpose_GCN;
+                    trans3Plan->gen           = Transpose_INPLACE;
 					trans3Plan->transflag     = true;
 					trans3Plan->transOutHorizontal = true;
 
@@ -1754,6 +1754,8 @@ clfftStatus	clfftBakePlan( clfftPlanHandle plHandle, cl_uint numQueues, cl_comma
                 clfftStatus err;
 				if(fftPlan->gen == Transpose_GCN)
 					fftPlan->action = new FFTGeneratedTransposeGCNAction(plHandle, fftPlan, *commQueueFFT, err);
+				else if(fftPlan->gen == Transpose_INPLACE)
+					fftPlan->action = new FFTGeneratedTransposeInplaceAction(plHandle, fftPlan, *commQueueFFT, err);
 				else
 					fftPlan->action = new FFTGeneratedTransposeVLIWAction(plHandle, fftPlan, *commQueueFFT, err);
                 OPENCL_V( err, "FFTGeneratedTransposeVLIWAction failed");
@@ -3966,9 +3968,10 @@ clfftStatus FFTPlan::GetMax1DLength (size_t *longest ) const
 	{
 	case Stockham:		return GetMax1DLengthStockham(longest);
 	//No restriction for Transpose_VLIW kernel
-	case Transpose_VLIW:     *longest = 4096; return CLFFT_SUCCESS;
-    case Transpose_GCN:     *longest = 4096; return CLFFT_SUCCESS;
-    case Copy:			*longest = 4096; return CLFFT_SUCCESS;
+	case Transpose_VLIW:		*longest = 4096; return CLFFT_SUCCESS;
+    case Transpose_GCN:			*longest = 4096; return CLFFT_SUCCESS;
+    case Transpose_INPLACE:     *longest = 4096; return CLFFT_SUCCESS;
+    case Copy:					*longest = 4096; return CLFFT_SUCCESS;
 	default:			assert(false); return CLFFT_NOTIMPLEMENTED;
 	}
 }

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/clfft.git



More information about the debian-science-commits mailing list