change the header files to be compatible with the newly organized stim/cuda direct…

…ory, and add the stim/cuda/ivote subdirectory that includes the ivote-related functions

change the header files to be compatible with the newly organized stim/cuda direct…
…ory, and add the stim/cuda/ivote subdirectory that includes the ivote-related functions
Laila Saadatifard
1 parent 5cc0976c
Showing 13 changed files with 31 additions and 110 deletions Show diff stats
stim/cuda/arraymath/array_add.cuh
stim/cuda/arraymath/array_multiply.cuh
stim/cuda/gaussian_blur.cuh
stim/cuda/ivote.cuh
stim/cuda/down_sample.cuh → stim/cuda/ivote/down_sample.cuh
stim/cuda/local_max.cuh → stim/cuda/ivote/local_max.cuh
stim/cuda/update_dir.cuh → stim/cuda/ivote/update_dir.cuh
stim/cuda/vote.cuh → stim/cuda/ivote/vote.cuh
stim/cuda/templates/conv2.cuh
stim/cuda/templates/gaussian_blur.cuh
stim/cuda/templates/gradient.cuh
stim/image/image.h
stim/math/vector.h
@@ -3,8 +3,7 @@
 #include <iostream>
 #include <cuda.h>
-#include <stim/cuda/devices.h>
-#include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 namespace stim{
 	namespace cuda{
@@ -3,8 +3,7 @@
 #include <iostream>
 #include <cuda.h>
-#include <stim/cuda/devices.h>
-#include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 namespace stim{
 	namespace cuda{
-#ifndef STIM_CUDA_GAUSSIAN_BLUR_H
-#define STIM_CUDA_GAUSSIAN_BLUR_H
-
-#include <iostream>
-#include <cuda.h>
-#include <stim/cuda/cudatools.h>
-#include <stim/cuda/sharedmem.cuh>
-#include <stim/cuda/templates/conv2sep.cuh>		//GPU-based separable convolution algorithm
-
-#define pi	3.14159
-
-namespace stim{
-	namespace cuda{
-
-		template<typename T>
-		void gen_gaussian(T* out, T sigma, unsigned int width){
-
-			//fill the kernel with a gaussian
-			for(unsigned int xi = 0; xi < width; xi++){
-
-				float x = (float)xi - (float)(width/2);	//calculate the x position of the gaussian
-				float g = 1.0 / (sigma * sqrt(2 * 3.14159)) * exp( - (x*x) / (2*sigma*sigma) );
-				out[xi] = g;
-			}
-
-		}
-
-		template<typename T>
-		void tex_gaussian_blur2(T* out, T sigma, unsigned int x, unsigned int y, cudaTextureObject_t texObj, cudaArray* cuArray){
-
-			//allocate space for the kernel
-			unsigned int kwidth = sigma * 8 + 1;
-			float* kernel0 = (float*) malloc( kwidth * sizeof(float) );
-
-			//fill the kernel with a gaussian
-			gen_gaussian(kernel0, sigma, kwidth);
-
-			//copy the kernel to the GPU
-			T* gpuKernel0;
-			HANDLE_ERROR(cudaMemcpy(gpuKernel0, kernel0, kwidth * sizeof(T), cudaMemcpyHostToDevice));
-
-			//perform the gaussian blur as a separable convolution
-			stim::cuda::tex_conv2sep(out, x, y, texObj, cuArray, gpuKernel0, kwidth, gpuKernel0, kwidth);
-
-			HANDLE_ERROR(cudaFree(gpuKernel0));
-
-		}
-
-		template<typename T>
-		void gpu_gaussian_blur2(T* image, T sigma, unsigned int x, unsigned int y){
-
-			//allocate space for the kernel
-			unsigned int kwidth = sigma * 8 + 1;
-			float* kernel0 = (float*) malloc( kwidth * sizeof(float) );
-
-			//fill the kernel with a gaussian
-			gen_gaussian(kernel0, sigma, kwidth);
-
-			//copy the kernel to the GPU
-			T* gpuKernel0;
-			HANDLE_ERROR(cudaMemcpy(gpuKernel0, kernel0, kwidth * sizeof(T), cudaMemcpyHostToDevice));
-
-			//perform the gaussian blur as a separable convolution
-			stim::cuda::gpu_conv2sep<float>(image, x, y, gpuKernel0, kwidth, gpuKernel0, kwidth);
-
-			HANDLE_ERROR(cudaFree(gpuKernel0));
-
-		}
-
-		/// Applies a Gaussian blur to a 2D image stored on the CPU
-		template<typename T>
-		void cpu_gaussian_blur2(T* image, T sigma, unsigned int x, unsigned int y){
-
-			//allocate space for the kernel
-			unsigned int kwidth = sigma * 8 + 1;
-			float* kernel0 = (float*) malloc( kwidth * sizeof(float) );
-
-			//fill the kernel with a gaussian
-			gen_gaussian(kernel0, sigma, kwidth);
-
-			//perform the gaussian blur as a separable convolution
-			stim::cuda::cpu_conv2sep<float>(image, x, y, kernel0, kwidth, kernel0, kwidth);
-			
-		}
-		
-	};
-};
-
-#endif
 \ No newline at end of file
+#ifndef STIM_CUDA_IVOTE_H
+#define STIM_CUDA_IVOTE_H
+
+#include <stim/cuda/ivote/down_sample.cuh>
+#include <stim/cuda/ivote/local_max.cuh>
+#include <stim/cuda/ivote/update_dir.cuh>
+#include <stim/cuda/ivote/vote.cuh>
+
+namespace stim{
+	namespace cuda{
+	
+	}
+}
+
+
+
+#endif
 \ No newline at end of file
@@ -3,9 +3,8 @@
 #include <iostream>
 #include <cuda.h>
-#include <stim/cuda/devices.h>
-#include <stim/cuda/timer.h>
-#include <stim/cuda/gaussian_blur.cuh>
+#include <stim/cuda/cudatools.h>
+#include <stim/cuda/templates/gaussian_blur.cuh>
 namespace stim{
 	namespace cuda{
@@ -51,7 +50,7 @@ namespace stim{
 			dim3 threads(max_threads, 1);
 			dim3 blocks(x_ds/threads.x + (x_ds %threads.x == 0 ? 0:1) , y_ds);
-			stim::cuda::gpu_gaussian_blur_2d<float>(gpuI0, sigma_ds,x ,y);
+			stim::cuda::gpu_gaussian_blur2<float>(gpuI0, sigma_ds,x ,y);
 			//resample the image
 			down_sample<float> <<< blocks, threads >>>(gpuI, gpuI0, resize, x, y);
@@ -4,8 +4,7 @@
 # include <iostream>
 # include <cuda.h>
-# include <stim/cuda/devices.h>
-# include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 namespace stim{
 	namespace cuda{
@@ -4,8 +4,7 @@
 # include <iostream>
 # include <cuda.h>
-# include <stim/cuda/devices.h>
-# include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 #include <stim/cuda/sharedmem.cuh>
 namespace stim{
@@ -4,8 +4,7 @@
 # include <iostream>
 # include <cuda.h>
-# include <stim/cuda/devices.h>
-# include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 #include <stim/cuda/sharedmem.cuh>
@@ -3,8 +3,7 @@
 #include <iostream>
 #include <cuda.h>
-#include <stim/cuda/devices.h>
-#include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 #include <cmath>
 #include <algorithm>
@@ -58,6 +58,7 @@ namespace stim{
 			//copy the kernel to the GPU
 			T* gpuKernel0;
+			HANDLE_ERROR(cudaMalloc(&gpuKernel0, kwidth * sizeof(T)));
 			HANDLE_ERROR(cudaMemcpy(gpuKernel0, kernel0, kwidth * sizeof(T), cudaMemcpyHostToDevice));
 			//perform the gaussian blur as a separable convolution
@@ -3,8 +3,7 @@
 #include <iostream>
 #include <cuda.h>
-#include <stim/cuda/devices.h>
-#include <stim/cuda/error.h>
+#include <stim/cuda/cudatools.h>
 namespace stim{
 	namespace cuda{
@@ -174,7 +174,7 @@ public:
 	/// Returns the maximum pixel value in the image
-	T max(){
+	T maxv(){
 		float max = 0;
 		unsigned long N = width() * height();		//get the number of pixels
@@ -190,7 +190,7 @@ public:
 	}
 	/// Returns the minimum pixel value in the image
-	T min(){
+	T minv(){
 		float min = 0;
 		unsigned long N = width() * height();		//get the number of pixels
@@ -5,7 +5,7 @@
 #include <cmath>
 #include <sstream>
 #include <vector>
-#include "../cuda/callable.h"
+#include "../cuda/cudatools/callable.h"
 namespace stim
 {