codebase / stimlib

Browse Code »

Commit ad2123e6f9eb1be476fccb05626ce7aaa24d502d

Authored by David Mayerich 2016-06-15 12:52:04 -0500

2 parents 0c9d37c7 3a74ec6d

Merge branch 'master' of git.stim.ee.uh.edu:codebase/stimlib

Showing 3 changed files with 336 additions and 0 deletions Show diff stats

Inline Side-by-side

stim/math/fft.h 0 → 100644

Wrap text Show/Hide comments View file @ad2123e

	1	+#ifndef STIM_FFT_H
	2	+#define STIM_FFT_H
	3	+
	4	+namespace stim{
	5	+
	6	+ template<class T>
	7	+ void circshift(T out, const T in, size_t xdim, size_t ydim, size_t xshift, size_t yshift){
	8	+ size_t i, j, ii, jj;
	9	+ for (i =0; i < xdim; i++) {
	10	+ ii = (i + xshift) % xdim;
	11	+ for (j = 0; j < ydim; j++) {
	12	+ jj = (j + yshift) % ydim;
	13	+ out[ii * ydim + jj] = in[i * ydim + j];
	14	+ }
	15	+ }
	16	+ }
	17	+
	18	+ template<typename T>
	19	+ void cpu_fftshift(T* out, T* in, size_t xdim, size_t ydim){
	20	+ circshift(out, in, xdim, ydim, xdim/2, ydim/2);
	21	+ }
	22	+
	23	+ template<typename T>
	24	+ void cpu_ifftshift(T* out, T* in, size_t xdim, size_t ydim){
	25	+ circshift(out, in, xdim, ydim, xdim/2, ydim/2);
	26	+ }
	27	+
	28	+
	29	+}
	30	+
	31	+#endif
0	32	\ No newline at end of file
...	...

stim/optics/lens.h 0 → 100644

Wrap text Show/Hide comments View file @ad2123e

	1	+#ifndef STIM_LENS_H
	2	+#define STIM_LENS_H
	3	+
	4	+#include "scalarwave.h"
	5	+#include "../math/bessel.h"
	6	+#include "../cuda/cudatools/devices.h"
	7	+#include "../visualization/colormap.h"
	8	+#include "../math/fft.h"
	9	+
	10	+#include "cufft.h"
	11	+
	12	+#include <cmath>
	13	+
	14	+namespace stim{
	15	+
	16	+ /// Perform a k-space transform of a scalar field (FFT). The given field has a width of x and the calculated momentum space has a
	17	+ /// width of kx (in radians).
	18	+ /// @param K is a pointer to the output array of all plane waves in the field
	19	+ /// @param kx is the width of the frame in momentum space
	20	+ /// @param ky is the height of the frame in momentum space
	21	+ /// @param E is the field to be transformed
	22	+ /// @param x is the width of the field in the spatial domain
	23	+ /// @param y is the height of the field in the spatial domain
	24	+ /// @param nx is the number of pixels representing the field in the x (and kx) direction
	25	+ /// @param ny is the number of pixels representing the field in the y (and ky) direction
	26	+ template<typename T>
	27	+ void cpu_scalar_to_kspace(stim::complex<T>* K, T& kx, T& ky, stim::complex<T>* E, T x, T y, size_t nx, size_t ny){
	28	+
	29	+ kx = stim::TAU * nx / x; //calculate the width of the momentum space
	30	+ ky = stim::TAU * ny / y;
	31	+
	32	+ stim::complex<T>* dev_FFT;
	33	+ HANDLE_ERROR( cudaMalloc(&dev_FFT, sizeof(stim::complex<T>) * nx * ny) ); //allocate space on the CUDA device for the output array
	34	+
	35	+ stim::complex<T>* dev_E;
	36	+ HANDLE_ERROR( cudaMalloc(&dev_E, sizeof(stim::complex<T>) * nx * ny) ); //allocate space for the field
	37	+ HANDLE_ERROR( cudaMemcpy(dev_E, E, sizeof(stim::complex<T>) * nx * ny, cudaMemcpyHostToDevice) ); //copy the field to GPU memory
	38	+
	39	+ cufftResult result;
	40	+ cufftHandle plan;
	41	+ result = cufftPlan2d(&plan, nx, ny, CUFFT_C2C);
	42	+ if(result != CUFFT_SUCCESS){
	43	+ std::cout<<"Error creating cuFFT plan."<<std::endl;
	44	+ exit(1);
	45	+ }
	46	+
	47	+ result = cufftExecC2C(plan, (cufftComplex)dev_E, (cufftComplex)dev_FFT, CUFFT_FORWARD);
	48	+ if(result != CUFFT_SUCCESS){
	49	+ std::cout<<"Error using cuFFT to perform a forward Fourier transform of the field."<<std::endl;
	50	+ exit(1);
	51	+ }
	52	+
	53	+ stim::complex<T>* fft = (stim::complex<T>) malloc(sizeof(stim::complex<T>) nx * ny);
	54	+ HANDLE_ERROR( cudaMemcpy(fft, dev_FFT, sizeof(stim::complex<T>) * nx * ny, cudaMemcpyDeviceToHost) );
	55	+
	56	+ stim::cpu_fftshift(K, fft, nx, ny);
	57	+ }
	58	+
	59	+ template<typename T>
	60	+ void cpu_scalar_from_kspace(stim::complex<T>* E, T& x, T& y, stim::complex<T>* K, T kx, T ky, size_t nx, size_t ny){
	61	+
	62	+ x = stim::TAU * nx / kx; //calculate the width of the momentum space
	63	+ y = stim::TAU * ny / ky;
	64	+
	65	+ stim::complex<T>* fft = (stim::complex<T>) malloc(sizeof(stim::complex<T>) nx * ny);
	66	+ stim::cpu_ifftshift(fft, K, nx, ny);
	67	+
	68	+ stim::complex<T>* dev_FFT;
	69	+ HANDLE_ERROR( cudaMalloc(&dev_FFT, sizeof(stim::complex<T>) * nx * ny) ); //allocate space on the CUDA device for the output array
	70	+ HANDLE_ERROR( cudaMemcpy(dev_FFT, fft, sizeof(stim::complex<T>) * nx * ny, cudaMemcpyHostToDevice) ); //copy the field to GPU memory
	71	+
	72	+ stim::complex<T>* dev_E;
	73	+ HANDLE_ERROR( cudaMalloc(&dev_E, sizeof(stim::complex<T>) * nx * ny) ); //allocate space for the field
	74	+
	75	+ cufftResult result;
	76	+ cufftHandle plan;
	77	+ result = cufftPlan2d(&plan, nx, ny, CUFFT_C2C);
	78	+ if(result != CUFFT_SUCCESS){
	79	+ std::cout<<"Error creating cuFFT plan."<<std::endl;
	80	+ exit(1);
	81	+ }
	82	+
	83	+ result = cufftExecC2C(plan, (cufftComplex)dev_FFT, (cufftComplex)dev_E, CUFFT_FORWARD);
	84	+ if(result != CUFFT_SUCCESS){
	85	+ std::cout<<"Error using cuFFT to perform a forward Fourier transform of the field."<<std::endl;
	86	+ exit(1);
	87	+ }
	88	+
	89	+ HANDLE_ERROR( cudaMemcpy(E, dev_E, sizeof(stim::complex<T>) * nx * ny, cudaMemcpyDeviceToHost) );
	90	+
	91	+
	92	+ }
	93	+
	94	+ /// Propagate a field slice along its orthogonal direction by a given distance z
	95	+ /// @param Enew is the resulting propogated field
	96	+ template<typename T>
	97	+ void cpu_scalar_propagate(stim::complex<T>* Enew, stim::complex<T>* E, T sx, T sy, T z, T k, size_t nx, size_t ny){
	98	+
	99	+ stim::complex<T>* K = (stim::complex<T>) malloc( sizeof(stim::complex<T>) nx * ny );
	100	+
	101	+ T Kx, Ky; //width and height in k space
	102	+ cpu_scalar_to_kspace(K, Kx, Ky, E ,sx, sy, nx, ny);
	103	+
	104	+ T* mag = (T) malloc( sizeof(T) nx * ny );
	105	+ stim::abs(mag, K, nx * ny);
	106	+ stim::cpu2image<float>(mag, "kspace_pre_shift.bmp", nx, ny, stim::cmBrewer);
	107	+
	108	+ size_t kxi, kyi;
	109	+ size_t i;
	110	+ T kx, kx_sq, ky, ky_sq, k_sq;
	111	+ T kz;
	112	+ stim::complex<T> shift;
	113	+ T min_kx = -Kx / 2;
	114	+ T dkx = Kx / (nx);
	115	+ T min_ky = -Ky / 2;
	116	+ T dky = Ky / (ny);
	117	+ for(kyi = 0; kyi < ny; kyi++){ //for each plane wave in the ky direction
	118	+ for(kxi = 0; kxi < nx; kxi++){ //for each plane wave in the ky direction
	119	+ i = kyi * nx + kxi;
	120	+
	121	+ kx = min_kx + kxi * dkx; //calculate the position of the current plane wave
	122	+ ky = min_ky + kyi * dky;
	123	+
	124	+ kx_sq = kx * kx;
	125	+ ky_sq = ky * ky;
	126	+ k_sq = k*k;
	127	+
	128	+ if(kx_sq + ky_sq < k_sq){
	129	+ kz = sqrt(kk - kx kx - ky * ky); //estimate kz using the Fresnel approximation
	130	+ shift = -exp(stim::complex<T>(0, kz * z));
	131	+ K[i] *= shift;
	132	+ }
	133	+ else{
	134	+ K[i] = 0;
	135	+ }
	136	+ }
	137	+ }
	138	+
	139	+ stim::abs(mag, K, nx * ny);
	140	+ stim::cpu2image<float>(mag, "kspace_post_shift.bmp", nx, ny, stim::cmBrewer);
	141	+
	142	+ cpu_scalar_from_kspace(Enew, sx, sy, K, Kx, Ky, nx, ny);
	143	+ }
	144	+
	145	+}
	146	+
	147	+
	148	+#endif
0	149	\ No newline at end of file
...	...

stim/optics/scalarfield.h 0 → 100644

Wrap text Show/Hide comments View file @ad2123e

	1	+#ifndef STIM_SCALARFIELD_H
	2	+#define STIM_SCALARFIELD_H
	3	+
	4	+#include "../math/rect.h"
	5	+#include "../math/complex.h"
	6	+
	7	+namespace stim{
	8	+
	9	+ enum locationType {CPUmem, GPUmem};
	10	+
	11	+ /// Class represents a scalar optical field.
	12	+
	13	+ /// In general, this class is designed to operate between the CPU and GPU. So, make sure all functions have an option to create the output on either.
	14	+ /// The field is stored either on the GPU or host memory, but not both. This enforces that there can't be different copies of the same field.
	15	+ /// This class is designed to be included in all of the other scalar optics classes, allowing them to render output data so make sure to keep it general and compatible.
	16	+
	17	+template<typename T>
	18	+class scalarfield : public rect<T>{
	19	+
	20	+protected:
	21	+ stim::complex<T>* E;
	22	+ size_t R[2];
	23	+ locationType loc;
	24	+
	25	+
	26	+
	27	+public:
	28	+
	29	+ CUDA_CALLABLE scalarfield(size_t X, size_t Y, T size = 1, T z_pos = 0) : rect<T>::rect(size, z_pos){
	30	+ R[0] = X; //set the field resolution
	31	+ R[1] = Y;
	32	+
	33	+ E = (stim::complex<T>) malloc(sizeof(stim::complex<T>) R[0] * R[1]); //allocate in CPU memory
	34	+ loc = CPUmem;
	35	+ }
	36	+
	37	+ CUDA_CALLABLE ~scalarfield(){
	38	+ if(loc == CPUmem) free(E);
	39	+ else cudaFree(E);
	40	+ }
	41	+
	42	+ /// Returns the number of values in the field
	43	+ CUDA_CALLABLE size_t size(){
	44	+ return R[0] * R[1];
	45	+ }
	46	+
	47	+ CUDA_CALLABLE size_t grid_bytes(){
	48	+ return sizeof(stim::complex<T>) * R[0] * R[1];
	49	+ }
	50	+
	51	+ /// Calculates the distance between points on the grid
	52	+ T spacing(){
	53	+ T du = rect<T>::X.len() / R[0];
	54	+ T dv = rect<T>::Y.len() / R[1];
	55	+ return min<T>(du, dv);
	56	+ }
	57	+
	58	+ /// Copy the field array to the GPU, if it isn't already there
	59	+ void to_gpu(){
	60	+ if(loc == GPUmem) return;
	61	+ else{
	62	+ stim::complex<T>* dev_E;
	63	+ HANDLE_ERROR( cudaMalloc(&dev_E, e_bytes()) ); //allocate GPU memory
	64	+ HANDLE_ERROR( cudaMemcpy(dev_E, E, e_bytes(), cudaMemcpyHostToDevice) ); //copy the field to the GPU
	65	+ free(E); //free the CPU memory
	66	+ E = dev_E; //swap pointers
	67	+ }
	68	+ }
	69	+
	70	+ /// Copy the field array to the CPU, if it isn't already there
	71	+ void to_cpu(){
	72	+ if(loc == CPUmem) return;
	73	+ else{
	74	+ stim::complex<T>* host_E = (stim::complex<T>*) malloc(e_bytes()); //allocate space in main memory
	75	+ HANDLE_ERROR( cudaMemcpy(host_E, E, e_bytes(), cudaMemcpyDeviceToHost) ); //copy from GPU to CPU
	76	+ HANDLE_ERROR( cudaFree(E) ); //free device memory
	77	+ E = host_E; //swap pointers
	78	+ }
	79	+ }
	80	+
	81	+ std::string str(){
	82	+ std::stringstream ss;
	83	+ ss<<rect<T>::str()<<std::endl;
	84	+ ss<<"[ "<<R[0]<<" x "<<R[1]<<" ]"<<std::endl;
	85	+ ss<<"location: ";
	86	+ if(loc == CPUmem) ss<<"CPU";
	87	+ else ss<<"GPU";
	88	+
	89	+ ss<<endl;
	90	+ return ss.str();
	91	+ }
	92	+
	93	+ stim::complex<T>* ptr(){
	94	+ return E;
	95	+ }
	96	+
	97	+ /// Evaluate the cartesian coordinates of each point in the field. The resulting arrays are allocated in the same memory where the field is stored.
	98	+ void meshgrid(T* X, T* Y, T* Z, locationType location){
	99	+ size_t array_size = sizeof(T) * R[0] * R[1];
	100	+ if(location == CPUmem){
	101	+
	102	+ T du = 1.0 / (R[0] - 1); //calculate the spacing between points in the grid
	103	+ T dv = 1.0 / (R[1] - 1);
	104	+
	105	+ size_t ui, vi, i;
	106	+ stim::vec3<T> p;
	107	+ for(vi = 0; vi < R[1]; vi++){
	108	+ i = vi * R[0];
	109	+ for(ui = 0; ui < R[0]; ui++){
	110	+ p = rect<T>::p(ui * du, vi * dv);
	111	+ X[i] = p[0];
	112	+ Y[i] = p[1];
	113	+ Z[i] = p[2];
	114	+ i++;
	115	+ }
	116	+ }
	117	+ stim::cpu2image(X, "X.bmp", R[0], R[1], stim::cmBrewer);
	118	+ stim::cpu2image(Y, "Y.bmp", R[0], R[1], stim::cmBrewer);
	119	+ stim::cpu2image(Z, "Z.bmp", R[0], R[1], stim::cmBrewer);
	120	+ }
	121	+ else{
	122	+ std::cout<<"GPU allocation of a meshgrid isn't supported yet. You'll have to write kernels to do the calculation.";
	123	+ exit(1);
	124	+ }
	125	+ }
	126	+
	127	+ void image(std::string filename, stim::complexComponentType type = complexMag, stim::colormapType cmap = stim::cmBrewer){
	128	+
	129	+ if(loc == GPUmem) to_cpu(); //if the field is in the GPU, move it to the CPU
	130	+ T* image = (T) malloc( sizeof(T) size() ); //allocate space for the real image
	131	+
	132	+ switch(type){ //get the specified component from the complex value
	133	+ case complexMag:
	134	+ stim::abs(image, E, size());
	135	+ break;
	136	+ case complexReal:
	137	+ stim::real(image, E, size());
	138	+ break;
	139	+ case complexImaginary:
	140	+ stim::imag(image, E, size());
	141	+ }
	142	+ stim::cpu2image(image, filename, R[0], R[1], cmap); //save the resulting image
	143	+ free(image); //free the real image
	144	+ }
	145	+
	146	+}; //end class scalarfield
	147	+}
	148	+
	149	+//stream insertion operator
	150	+template<typename T>
	151	+std::ostream& operator<<(std::ostream& os, stim::scalarfield<T>& rhs){
	152	+ os<<rhs.str();
	153	+ return os;
	154	+}
	155	+
	156	+
	157	+#endif
0	158	\ No newline at end of file
...	...