fixed precision problems

David Mayerich
1 parent 57729e5b
Showing 12 changed files with 46 additions and 1273 deletions Show diff stats
math/complex.h
math/complex.h~
math/matrix.h~
math/point.h
math/point.h~
math/quad.h
math/quad.h~
math/quaternion.h
math/quaternion.h~
math/spherical_bessel.h
math/vector.h~
visualization/camera.h
@@ -5,7 +5,7 @@ and can therefore be used in CUDA code and on CUDA devices.
 #ifndef RTS_COMPLEX
 #define RTS_COMPLEX
  
-#include "cuda_callable.h"
+#include "../cuda/callable.h"
 #include <cmath>
 #include <string>
 #include <sstream>
@@ -22,8 +22,8 @@ struct complex
     //default constructor
     CUDA_CALLABLE complex()
     {
-        r = 0.0;
-		i = 0.0;
+        r = 0;
+	i = 0;
     }
  
 	//access methods
@@ -235,7 +235,7 @@ struct complex
  
 		//find the square root
 		T a_p = std::sqrt(a);
-		T theta_p = theta/2.0;
+		T theta_p = theta/2.0f;
  
 		//convert back to cartesian coordinates
 		result.r = a_p * std::cos(theta_p);
@@ -262,7 +262,7 @@ struct complex
  
     CUDA_CALLABLE bool operator==(T rhs)
 	{
-        if(r == rhs && i == (T)0.0)
+        if(r == rhs && i == 0)
             return true;
         return false;
     }
-/*RTS Complex number class.  This class is CUDA compatible,
-and can therefore be used in CUDA code and on CUDA devices.
-*/
-
-#ifndef RTS_COMPLEX
-#define RTS_COMPLEX
-
-#include "cuda_callable.h"
-#include <cmath>
-#include <string>
-#include <sstream>
-#include <iostream>
-
-namespace rts
-{
-
-template <class T>
-struct complex
-{
-    T r, i;
-
-    //default constructor
-    CUDA_CALLABLE complex()
-    {
-        r = 0.0;
-		i = 0.0;
-    }
-
-	//access methods
-	CUDA_CALLABLE T real()
-	{
-		return r;
-	}
-
-	CUDA_CALLABLE T real(T r_val)
-	{
-		r = r_val;
-		return r_val;
-	}
-
-	CUDA_CALLABLE T imag()
-	{
-		return i;
-	}
-	CUDA_CALLABLE T imag(T i_val)
-	{
-		i = i_val;
-		return i_val;
-	}
-
-    //constructor when given real and imaginary values
-    CUDA_CALLABLE complex(T r, T i)
-    {
-        this->r = r;
-        this->i = i;
-    }
-
-    //return the current value multiplied by i
-    CUDA_CALLABLE complex<T> imul()
-    {
-        complex<T> result;
-        result.r = -i;
-        result.i = r;
-
-        return result;
-    }
-
-	//ARITHMETIC OPERATORS--------------------
-
-    //binary + operator (returns the result of adding two complex values)
-    CUDA_CALLABLE complex<T> operator+ (const complex<T> rhs)
-    {
-        complex<T> result;
-        result.r = r + rhs.r;
-        result.i = i + rhs.i;
-        return result;
-    }
-
-	CUDA_CALLABLE complex<T> operator+ (const T rhs)
-    {
-        complex<T> result;
-        result.r = r + rhs;
-        result.i = i;
-        return result;
-    }
-
-    //binary - operator (returns the result of adding two complex values)
-    CUDA_CALLABLE complex<T> operator- (const complex<T> rhs)
-    {
-        complex<T> result;
-        result.r = r - rhs.r;
-        result.i = i - rhs.i;
-        return result;
-    }
-
-    //binary - operator (returns the result of adding two complex values)
-    CUDA_CALLABLE complex<T> operator- (const T rhs)
-    {
-        complex<T> result;
-        result.r = r - rhs;
-        result.i = i;
-        return result;
-    }
-
-    //binary MULTIPLICATION operators (returns the result of multiplying complex values)
-    CUDA_CALLABLE complex<T> operator* (const complex<T> rhs)
-    {
-        complex<T> result;
-        result.r = r * rhs.r - i * rhs.i;
-        result.i = r * rhs.i + i * rhs.r;
-        return result;
-    }
-    CUDA_CALLABLE complex<T> operator* (const T rhs)
-    {
-        return complex<T>(r * rhs, i * rhs);
-    }
-
-    //binary DIVISION operators (returns the result of dividing complex values)
-    CUDA_CALLABLE complex<T> operator/ (const complex<T> rhs)
-    {
-        complex<T> result;
-        T denom = rhs.r * rhs.r + rhs.i * rhs.i;
-        result.r = (r * rhs.r + i * rhs.i) / denom;
-        result.i = (- r * rhs.i + i * rhs.r) / denom;
-
-        return result;
-    }
-    CUDA_CALLABLE complex<T> operator/ (const T rhs)
-    {
-        return complex<T>(r / rhs, i / rhs);
-    }
-
-    //ASSIGNMENT operators-----------------------------------
-    CUDA_CALLABLE complex<T> & operator=(const complex<T> &rhs)
-    {
-        //check for self-assignment
-        if(this != &rhs)
-        {
-            this->r = rhs.r;
-            this->i = rhs.i;
-        }
-        return *this;
-    }
-    CUDA_CALLABLE complex<T> & operator=(const T &rhs)
-    {
-        this->r = rhs;
-        this->i = 0;
-
-		return *this;
-    }
-
-    //arithmetic assignment operators
-    CUDA_CALLABLE complex<T> operator+=(const complex<T> &rhs)
-    {
-		*this = *this + rhs;
-        return *this;
-    }
-    CUDA_CALLABLE complex<T> operator+=(const T &rhs)
-    {
-		*this = *this + rhs;
-        return *this;
-    }
-
-    CUDA_CALLABLE complex<T> operator*=(const complex<T> &rhs)
-    {
-		*this = *this * rhs;
-        return *this;
-    }
-	CUDA_CALLABLE complex<T> operator*=(const T &rhs)
-    {
-		*this = *this * rhs;
-        return *this;
-    }
-	//divide and assign
-	CUDA_CALLABLE complex<T> operator/=(const complex<T> &rhs)
-    {
-		*this = *this / rhs;
-        return *this;
-    }
-    CUDA_CALLABLE complex<T> operator/=(const T &rhs)
-    {
-		*this = *this / rhs;
-        return *this;
-    }
-
-    //absolute value operator (returns the absolute value of the complex number)
-	CUDA_CALLABLE T abs()
-	{
-		return std::sqrt(r * r + i * i);
-	}
-
-	CUDA_CALLABLE complex<T> log()
-	{
-        complex<T> result;
-        result.r = std::log(std::sqrt(r * r + i * i));
-        result.i = std::atan2(i, r);
-
-
-        return result;
-	}
-
-	CUDA_CALLABLE complex<T> exp()
-	{
-        complex<T> result;
-
-        T e_r = std::exp(r);
-        result.r = e_r * std::cos(i);
-        result.i = e_r * std::sin(i);
-
-        return result;
-	}
-
-	/*CUDA_CALLABLE complex<T> pow(int y)
-	{
-
-        return pow((double)y);
-	}*/
-
-	CUDA_CALLABLE complex<T> pow(T y)
-	{
-        complex<T> result;
-
-        result = log() * y;
-
-        return result.exp();
-	}
-
-	CUDA_CALLABLE complex<T> sqrt()
-	{
-		complex<T> result;
-
-		//convert to polar coordinates
-		T a = std::sqrt(r*r + i*i);
-		T theta = std::atan2(i, r);
-
-		//find the square root
-		T a_p = std::sqrt(a);
-		T theta_p = theta/2.0;
-
-		//convert back to cartesian coordinates
-		result.r = a_p * std::cos(theta_p);
-		result.i = a_p * std::sin(theta_p);
-
-		return result;
-	}
-
-	std::string toStr()
-	{
-		std::stringstream ss;
-		ss<<"("<<r<<","<<i<<")";
-
-		return ss.str();
-	}
-
-	//COMPARISON operators
-	CUDA_CALLABLE bool operator==(complex<T> rhs)
-	{
-        if(r == rhs.r && i == rhs.i)
-            return true;
-        return false;
-    }
-
-    CUDA_CALLABLE bool operator==(T rhs)
-	{
-        if(r == rhs && i == (T)0.0)
-            return true;
-        return false;
-    }
-
-};
-
-}	//end RTS namespace
-
-//addition
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> operator+(const double a, const rts::complex<T> b)
-{
-    return rts::complex<T>(a + b.r, b.i);
-}
-
-//subtraction with a real value
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> operator-(const double a, const rts::complex<T> b)
-{
-    return rts::complex<T>(a - b.r, -b.i);
-}
-
-//minus sign
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> operator-(const rts::complex<T> &rhs)
-{
-    return rts::complex<T>(-rhs.r, -rhs.i);
-}
-
-//multiply a T value by a complex value
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> operator*(const double a, const rts::complex<T> b)
-{
-    return rts::complex<T>((T)a * b.r, (T)a * b.i);
-}
-
-//divide a T value by a complex value
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> operator/(const double a, const rts::complex<T> b)
-{
-    //return complex<T>(a * b.r, a * b.i);
-    rts::complex<T> result;
-
-    T denom = b.r * b.r + b.i * b.i;
-
-    result.r = (a * b.r) / denom;
-    result.i = -(a * b.i) / denom;
-
-    return result;
-}
-
-//POW function
-/*template<typename T>
-CUDA_CALLABLE static complex<T> pow(complex<T> x, int y)
-{
-	return x.pow(y);
-}*/
-
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> pow(rts::complex<T> x, T y)
-{
-	return x.pow(y);
-}
-
-//log function
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> log(rts::complex<T> x)
-{
-	return x.log();
-}
-
-//exp function
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> exp(rts::complex<T> x)
-{
-	return x.exp();
-}
-
-//sqrt function
-template<typename T>
-CUDA_CALLABLE static rts::complex<T> sqrt(rts::complex<T> x)
-{
-	return x.sqrt();
-}
-
-
-template <typename T>
-CUDA_CALLABLE static T abs(rts::complex<T> a)
-{
-    return a.abs();
-}
-
-template <typename T>
-CUDA_CALLABLE static T real(rts::complex<T> a)
-{
-    return a.r;
-}
-
-//template <typename T>
-CUDA_CALLABLE static float real(float a)
-{
-    return a;
-}
-
-template <typename T>
-CUDA_CALLABLE static T imag(rts::complex<T> a)
-{
-    return a.i;
-}
-
-//trigonometric functions
-template<class A>
-CUDA_CALLABLE rts::complex<A> sin(const rts::complex<A> x)
-{
-	rts::complex<A> result;
-	result.r = std::sin(x.r) * std::cosh(x.i);
-	result.i = std::cos(x.r) * std::sinh(x.i);
-
-	return result;
-}
-
-template<class A>
-CUDA_CALLABLE rts::complex<A> cos(const rts::complex<A> x)
-{
-	rts::complex<A> result;
-	result.r = std::cos(x.r) * std::cosh(x.i);
-	result.i = -(std::sin(x.r) * std::sinh(x.i));
-
-	return result;
-}
-
-
-template<class A>
-std::ostream& operator<<(std::ostream& os, rts::complex<A> x)
-{
-    os<<x.toStr();
-    return os;
-}
-
-#if __GNUC__ > 3 && __GNUC_MINOR__ > 7
-template<class T> using rtsComplex = rts::complex<T>;
-#endif
-
-
-
-#endif
-#ifndef RTS_MATRIX_H
-#define RTS_MATRIX_H
-
-//#include "rts/vector.h"
-#include <string.h>
-#include <iostream>
-
-namespace rts
-{
-
-template <class T, int N>
-struct matrix
-{
-	//the matrix will be stored in column-major order (compatible with OpenGL)
-	T M[N*N];
-
-	matrix()
-	{
-		for(int r=0; r<N; r++)
-			for(int c=0; c<N; c++)
-				if(r == c)
-					(*this)(r, c) = 1;
-				else
-					(*this)(r, c) = 0;
-	}
-
-	T& operator()(int row, int col)
-	{
-		return M[col * N + row];
-	}
-
-	matrix<T, N> operator=(T rhs)
-	{
-		int Nsq = N*N;
-		for(int i=0; i<Nsq; i++)
-			M[i] = rhs;
-
-		return *this;
-	}
-
-	/*matrix<T, N> operator=(matrix<T, N> rhs)
-	{
-		for(int i=0; i<N; i++)
-			M[i] = rhs.M[i];
-
-		return *this;
-	}*/
-
-	vector<T, N> operator*(vector<T, N> rhs)
-	{
-		vector<T, N> result;
-
-		for(int r=0; r<N; r++)
-			for(int c=0; c<N; c++)
-				result[r] += (*this)(r, c) * rhs[c];
-
-		return result;
-	}
-
-	std::string toStr()
-	{
-		std::stringstream ss;
-
-		for(int r = 0; r < N; r++)
-		{
-			ss<<"| ";
-			for(int c=0; c<N; c++)
-			{
-				ss<<(*this)(r, c)<<" ";
-			}
-			ss<<"|"<<std::endl;
-		}
-
-		return ss.str();
-	}
-
-
-
-
-};
-
-}	//end namespace rts
-
-template <typename T, int N>
-std::ostream& operator<<(std::ostream& os, rts::matrix<T, N> M)
-{
-    os<<M.toStr();
-    return os;
-}
-
-#if __GNUC__ > 3 && __GNUC_MINOR__ > 7
-template<class T, int N> using rtsMatrix = rts::matrix<T, N>;
-#endif
-
-#endif
@@ -19,16 +19,27 @@ struct point
 	}
  
 	//efficiency constructor, makes construction easier for 1D-4D vectors
-	CUDA_CALLABLE point(T x, T y = (T)0.0, T z = (T)0.0, T w = (T)0.0)
+	CUDA_CALLABLE point(T x)
 	{
-		if(N >= 1)
-			p[0] = x;
-		if(N >= 2)
-			p[1] = y;
-		if(N >= 3)
-			p[2] = z;
-		if(N >= 4)
-			p[3] = w;
+		p[0] = x;
+	}
+	CUDA_CALLABLE point(T x, T y)
+	{
+		p[0] = x;
+		p[1] = y;
+	}
+	CUDA_CALLABLE point(T x, T y, T z)
+	{
+		p[0] = x;
+		p[1] = y;
+		p[2] = z;
+	}
+	CUDA_CALLABLE point(T x, T y, T z, T w)
+	{
+		p[0] = x;
+		p[1] = y;
+		p[2] = z;
+		p[3] = w;
 	}
  
 	//arithmetic operators
-#ifndef RTS_rtsPoint_H
-#define RTS_rtsPoint_H
-
-#include "rts/math/vector.h"
-#include <string.h>
-#include "rts/cuda/callable.h"
-
-namespace rts
-{
-
-template <class T, int N>
-struct point
-{
-	T p[N];
-
-	CUDA_CALLABLE point()
-	{
-
-	}
-
-	//efficiency constructor, makes construction easier for 1D-4D vectors
-	CUDA_CALLABLE point(T x, T y = (T)0.0, T z = (T)0.0, T w = (T)0.0)
-	{
-		if(N >= 1)
-			p[0] = x;
-		if(N >= 2)
-			p[1] = y;
-		if(N >= 3)
-			p[2] = z;
-		if(N >= 4)
-			p[3] = w;
-	}
-
-	//arithmetic operators
-	CUDA_CALLABLE rts::point<T, N> operator+(vector<T, N> v)
-	{
-        rts::point<T, N> r;
-
-        //calculate the position of the resulting point
-        for(int i=0; i<N; i++)
-            r.p[i] = p[i] + v.v[i];
-
-        return r;
-	}
-	CUDA_CALLABLE rts::point<T, N> operator-(vector<T, N> v)
-	{
-        rts::point<T, N> r;
-
-        //calculate the position of the resulting point
-        for(int i=0; i<N; i++)
-            r.p[i] = p[i] - v.v[i];
-
-        return r;
-	}
-	CUDA_CALLABLE vector<T, N> operator-(point<T, N> rhs)
-	{
-        vector<T, N> r;
-
-        //calculate the position of the resulting point
-        for(int i=0; i<N; i++)
-            r.v[i] = p[i] - rhs.p[i];
-
-        return r;
-	}
-	CUDA_CALLABLE rts::point<T, N> operator*(T rhs)
-	{
-        rts::point<T, N> r;
-
-        //calculate the position of the resulting point
-        for(int i=0; i<N; i++)
-            r.p[i] = p[i] * rhs;
-
-        return r;
-	}
-
-	CUDA_CALLABLE point(const T(&data)[N])
-	{
-		memcpy(p, data, sizeof(T) * N);
-	}
-
-	std::string toStr()
-	{
-		std::stringstream ss;
-
-		ss<<"(";
-		for(int i=0; i<N; i++)
-		{
-			ss<<p[i];
-			if(i != N-1)
-				ss<<", ";
-		}
-		ss<<")";
-
-		return ss.str();
-	}
-
-	//bracket operator
-	CUDA_CALLABLE T& operator[](int i)
-	{
-        return p[i];
-    }
-
-};
-
-}	//end namespace rts
-
-template <typename T, int N>
-std::ostream& operator<<(std::ostream& os, rts::point<T, N> p)
-{
-    os<<p.toStr();
-    return os;
-}
-
-//arithmetic
-template <typename T, int N>
-CUDA_CALLABLE rts::point<T, N> operator*(T lhs, rts::point<T, N> rhs)
-{
-    rts::point<T, N> r;
-
-    return rhs * lhs;
-}
-
-#if __GNUC__ > 3 && __GNUC_MINOR__ > 7
-template<class T, int N> using rtsPoint = rts::point<T, N>;
-#endif
-
-#endif
@@ -69,11 +69,11 @@ struct quad
  
         //calculate point B
         rts::point<T, 3> B;
-        B = A + v0 * 0.5 + v1 * 0.5;
+        B = A + v0 * 0.5f + v1 * 0.5f;
  
         //calculate rtsPoint C
         rts::point<T, 3> C;
-        C = A  + v0 * 0.5 - v1 * 0.5;
+        C = A  + v0 * 0.5f - v1 * 0.5f;
  
         //calculate X and Y
         X = B - A;
@@ -110,7 +110,7 @@ struct quad
         Y = Y * height;
  
         //set the corner of the plane
-        A = c - X * 0.5 - Y * 0.5;
+        A = c - X * 0.5f - Y * 0.5f;
  
         std::cout<<X<<std::endl;
 	}
@@ -155,13 +155,13 @@ struct quad
 		//scales the plane by a scalar value
  
 		//compute the center point
-		rts::point<T, N> c = A + X*0.5 + Y*0.5;
+		rts::point<T, N> c = A + X*0.5f + Y*0.5f;
  
 		//create the new quadangle
 		quad<T, N> result;
 		result.X = X * rhs;
 		result.Y = Y * rhs;
-		result.A = c - result.X*0.5 - result.Y*0.5;
+		result.A = c - result.X*0.5f - result.Y*0.5f;
  
 		return result;
  
@@ -192,7 +192,7 @@ struct quad
         T dc = (A+Y - p).len();
         T dd = (A+X+Y - p).len();
  
-        return std::max( da, std::max(db, std::max(dc, dd) ) );
+        return fmax( da, fmax(db, fmax(dc, dd) ) );
 	}
 };
  
-#ifndef RTS_RECT_H
-#define RTS_RECT_H
-
-//enable CUDA_CALLABLE macro
-#include "rts/cuda/callable.h"
-#include "rts/math/vector.h"
-#include "rts/math/point.h"
-#include "rts/math/triangle.h"
-#include "rts/math/quaternion.h"
-#include <iostream>
-#include <algorithm>
-
-namespace rts{
-
-//template for a quadangle class in ND space
-template <class T, int N>
-struct quad
-{
-	/*
-		C------------------>O
-		^                   ^
-		|                   |
-		Y                   |
-		|                   |
-		|                   |
-		A---------X-------->B
-	*/
-
-	/*T A[N];
-	T B[N];
-	T C[N];*/
-
-	rts::point<T, N> A;
-	rts::vector<T, N> X;
-	rts::vector<T, N> Y;
-
-
-	CUDA_CALLABLE quad()
-	{
-
-	}
-
-	CUDA_CALLABLE quad(point<T, N> a, point<T, N> b, point<T, N> c)
-	{
-
-		A = a;
-		X = b - a;
-		Y = c - a;
-
-	}
-
-    /****************************************************************
-    Constructor - create a quad from two points and a normal
-    ****************************************************************/
-	CUDA_CALLABLE quad(rts::point<T, N> pMin, rts::point<T, N> pMax, rts::vector<T, N> normal)
-	{
-
-        //assign the corner point
-        A = pMin;
-
-        //compute the vector from pMin to pMax
-        rts::vector<T, 3> v0;
-        v0 = pMax - pMin;
-
-        //compute the cross product of A and the plane normal
-        rts::vector<T, 3> v1;
-        v1 = v0.cross(normal);
-
-
-        //calculate point B
-        rts::point<T, 3> B;
-        B = A + v0 * 0.5 + v1 * 0.5;
-
-        //calculate rtsPoint C
-        rts::point<T, 3> C;
-        C = A  + v0 * 0.5 - v1 * 0.5;
-
-        //calculate X and Y
-        X = B - A;
-        Y = C - A;
-	}
-
-	/*******************************************************************
-	Constructor - create a quad from a position, normal, and rotation
-	*******************************************************************/
-	CUDA_CALLABLE quad(rts::point<T, N> c, rts::vector<T, N> normal, T width, T height, T theta)
-	{
-
-        //compute the X direction - start along world-space X
-        Y = rts::vector<T, N>(0, 1, 0);
-        if(Y == normal)
-            Y = rts::vector<T, N>(0, 0, 1);
-
-        X = Y.cross(normal).norm();
-
-        std::cout<<X<<std::endl;
-
-        //rotate the X axis by theta radians
-        rts::quaternion<T> q;
-        q.CreateRotation(theta, normal);
-        X = q.toMatrix3() * X;
-        Y = normal.cross(X);
-
-        //normalize everything
-        X = X.norm();
-        Y = Y.norm();
-
-        //scale to match the quad width and height
-        X = X * width;
-        Y = Y * height;
-
-        //set the corner of the plane
-        A = c - X * 0.5 - Y * 0.5;
-
-        std::cout<<X<<std::endl;
-	}
-
-	/*******************************************
-	Return the normal for the quad
-	*******************************************/
-	CUDA_CALLABLE rts::vector<T, N> n()
-	{
-        return (X.cross(Y)).norm();
-	}
-
-	CUDA_CALLABLE rts::point<T, N> p(T a, T b)
-	{
-		rts::point<T, N> result;
-		//given the two parameters a, b = [0 1], returns the position in world space
-		result = A + X * a + Y * b;
-
-		return result;
-	}
-
-	CUDA_CALLABLE rts::point<T, N> operator()(T a, T b)
-	{
-		return p(a, b);
-	}
-
-	std::string toStr()
-	{
-		std::stringstream ss;
-
-		ss<<"A = "<<A<<std::endl;
-		ss<<"B = "<<A + X<<std::endl;
-		ss<<"C = "<<A + X + Y<<std::endl;
-		ss<<"D = "<<A + Y<<std::endl;
-
-        return ss.str();
-
-	}
-
-	CUDA_CALLABLE quad<T, N> operator*(T rhs)
-	{
-		//scales the plane by a scalar value
-
-		//compute the center point
-		rts::point<T, N> c = A + X*0.5 + Y*0.5;
-
-		//create the new quadangle
-		quad<T, N> result;
-		result.X = X * rhs;
-		result.Y = Y * rhs;
-		result.A = c - result.X*0.5 - result.Y*0.5;
-
-		return result;
-
-	}
-
-	CUDA_CALLABLE T dist(point<T, N> p)
-	{
-        //compute the distance between a point and this quad
-
-        //first break the quad up into two triangles
-        triangle<T, N> T0(A, A+X, A+Y);
-        triangle<T, N> T1(A+X+Y, A+X, A+Y);
-
-
-        ptype d0 = T0.dist(p);
-        ptype d1 = T1.dist(p);
-
-        if(d0 < d1)
-            return d0;
-        else
-            return d1;
-	}
-
-	CUDA_CALLABLE T dist_max(point<T, N> p)
-	{
-        T da = (A - p).len();
-        T db = (A+X - p).len();
-        T dc = (A+Y - p).len();
-        T dd = (A+X+Y - p).len();
-
-        return std::max( da, max(db, max(dc, dd) ) );
-	}
-};
-
-}	//end namespace rts
-
-template <typename T, int N>
-std::ostream& operator<<(std::ostream& os, rts::quad<T, N> R)
-{
-    os<<R.toStr();
-    return os;
-}
-
-
-#endif
@@ -41,10 +41,10 @@ template<typename T>
 void quaternion<T>::CreateRotation(T theta, T axis_x, T axis_y, T axis_z)
 {
 	//assign the given Euler rotation to this quaternion
-	w = (T)cos(theta/2.0);
-	x = axis_x*(T)sin(theta/2.0);
-	y = axis_y*(T)sin(theta/2.0);
-	z = axis_z*(T)sin(theta/2.0);
+	w = (T)cos(theta/2);
+	x = axis_x*(T)sin(theta/2);
+	y = axis_y*(T)sin(theta/2);
+	z = axis_z*(T)sin(theta/2);
 }
  
 template<typename T>
@@ -93,20 +93,20 @@ matrix<T, 3> quaternion<T>::toMatrix3()
     yy = y * y2; yz = y * z2; zz = z * z2;
     wx = w * x2; wy = w * y2; wz = w * z2;
  
-	result(0, 0) = (T)1.0 - (yy + zz);
+	result(0, 0) = 1 - (yy + zz);
 	result(0, 1) = xy - wz;
  
 	result(0, 2) = xz + wy;
  
 	result(1, 0) = xy + wz;
-	result(1, 1) = (T)1.0 - (xx + zz);
+	result(1, 1) = 1 - (xx + zz);
  
 	result(1, 2) = yz - wx;
  
 	result(2, 0) = xz - wy;
 	result(2, 1) = yz + wx;
  
-	result(2, 2) = (T)1.0 - (xx + yy);
+	result(2, 2) = 1 - (xx + yy);
  
 	return result;
 }
@@ -127,22 +127,22 @@ matrix<T, 4> quaternion<T>::toMatrix4()
     yy = y * y2; yz = y * z2; zz = z * z2;
     wx = w * x2; wy = w * y2; wz = w * z2;
  
-	result(0, 0) = (T)1.0 - (yy + zz);
+	result(0, 0) = 1 - (yy + zz);
 	result(0, 1) = xy - wz;
  
 	result(0, 2) = xz + wy;
  
 	result(1, 0) = xy + wz;
-	result(1, 1) = (T)1.0 - (xx + zz);
+	result(1, 1) = 1 - (xx + zz);
  
 	result(1, 2) = yz - wx;
  
 	result(2, 0) = xz - wy;
 	result(2, 1) = yz + wx;
  
-	result(2, 2) = (T)1.0 - (xx + yy);
+	result(2, 2) = 1 - (xx + yy);
  
-	result(3, 3) = (T)1.0;
+	result(3, 3) = 1;
  
 	return result;
 }
@@ -150,7 +150,7 @@ matrix<T, 4> quaternion<T>::toMatrix4()
 template<typename T>
 quaternion<T>::quaternion()
 {
-	w=0.0; x=0.0; y=0.0; z=0.0;
+	w=0; x=0; y=0; z=0;
 }
  
 template<typename T>
-#include "rts/math/matrix.h"
-
-#ifndef RTS_QUATERNION_H
-#define RTS_QUATERNION_H
-
-namespace rts{
-
-template<typename T>
-class quaternion
-{
-public:
-	T w;
-	T x;
-	T y;
-	T z;
-
-	void normalize();
-	void CreateRotation(T theta, T axis_x, T axis_y, T axis_z);
-	void CreateRotation(T theta, vector<T, 3> axis);
-	quaternion<T> operator*(quaternion<T> &rhs);
-	matrix<T, 3> toMatrix3();
-	matrix<T, 4> toMatrix4();
-
-
-	quaternion();
-	quaternion(T w, T x, T y, T z);
-
-};
-
-template<typename T>
-void quaternion<T>::normalize()
-{
-	double length=sqrt(w*w + x*x + y*y + z*z);
-	w=w/length;
-	x=x/length;
-	y=y/length;
-	z=z/length;
-}
-
-template<typename T>
-void quaternion<T>::CreateRotation(T theta, T axis_x, T axis_y, T axis_z)
-{
-	//assign the given Euler rotation to this quaternion
-	w = (T)cos(theta/2.0);
-	x = axis_x*(T)sin(theta/2.0);
-	y = axis_y*(T)sin(theta/2.0);
-	z = axis_z*(T)sin(theta/2.0);
-}
-
-template<typename T>
-void quaternion<T>::CreateRotation(T theta, vector<T, 3> axis)
-{
-	CreateRotation(theta, axis[0], axis[1], axis[2]);
-}
-
-template<typename T>
-quaternion<T> quaternion<T>::operator *(quaternion<T> &param)
-{
-	float A, B, C, D, E, F, G, H;
-
-
-	A = (w + x)*(param.w + param.x);
-	B = (z - y)*(param.y - param.z);
-	C = (w - x)*(param.y + param.z);
-	D = (y + z)*(param.w - param.x);
-	E = (x + z)*(param.x + param.y);
-	F = (x - z)*(param.x - param.y);
-	G = (w + y)*(param.w - param.z);
-	H = (w - y)*(param.w + param.z);
-
-	quaternion<T> result;
-	result.w = B + (-E - F + G + H) /2;
-	result.x = A - (E + F + G + H)/2;
-	result.y = C + (E - F + G - H)/2;
-	result.z = D + (E - F - G + H)/2;
-
-	return result;
-}
-
-template<typename T>
-matrix<T, 3> quaternion<T>::toMatrix3()
-{
-	matrix<T, 3> result;
-
-
-    T wx, wy, wz, xx, yy, yz, xy, xz, zz, x2, y2, z2;
-
-
-    // calculate coefficients
-    x2 = x + x; y2 = y + y;
-    z2 = z + z;
-    xx = x * x2; xy = x * y2; xz = x * z2;
-    yy = y * y2; yz = y * z2; zz = z * z2;
-    wx = w * x2; wy = w * y2; wz = w * z2;
-
-	result(0, 0) = (T)1.0 - (yy + zz);
-	result(0, 1) = xy - wz;
-
-	result(0, 2) = xz + wy;
-
-	result(1, 0) = xy + wz;
-	result(1, 1) = (T)1.0 - (xx + zz);
-
-	result(1, 2) = yz - wx;
-
-	result(2, 0) = xz - wy;
-	result(2, 1) = yz + wx;
-
-	result(2, 2) = (T)1.0 - (xx + yy);
-
-	return result;
-}
-
-template<typename T>
-matrix<T, 4> quaternion<T>::toMatrix4()
-{
-	matrix<T, 4> result;
-
-
-    T wx, wy, wz, xx, yy, yz, xy, xz, zz, x2, y2, z2;
-
-
-    // calculate coefficients
-    x2 = x + x; y2 = y + y;
-    z2 = z + z;
-    xx = x * x2; xy = x * y2; xz = x * z2;
-    yy = y * y2; yz = y * z2; zz = z * z2;
-    wx = w * x2; wy = w * y2; wz = w * z2;
-
-	result(0, 0) = (T)1.0 - (yy + zz);
-	result(0, 1) = xy - wz;
-
-	result(0, 2) = xz + wy;
-
-	result(1, 0) = xy + wz;
-	result(1, 1) = (T)1.0 - (xx + zz);
-
-	result(1, 2) = yz - wx;
-
-	result(2, 0) = xz - wy;
-	result(2, 1) = yz + wx;
-
-	result(2, 2) = (T)1.0 - (xx + yy);
-
-	result(3, 3) = (T)1.0;
-
-	return result;
-}
-
-template<typename T>
-quaternion<T>::quaternion()
-{
-	w=0.0; x=0.0; y=0.0; z=0.0;
-}
-
-template<typename T>
-quaternion<T>::quaternion(T c, T i, T j, T k)
-{
-	w=c;  x=i;  y=j;  z=k;
-}
-
-}	//end rts namespace
-
-#if __GNUC__ > 3 && __GNUC_MINOR__ > 7
-template<class T> using rtsQuaternion = rts::quaternion<T>;
-#endif
-
-#endif
@@ -111,7 +111,7 @@ CUDA_CALLABLE void shift_sbesselj(int n, T x, T* b)//, T stability = 1.4)
 	//if(n > stability*x)
 	if(n > real(x))
 		if(real(bnew) < RTS_BESSEL_CONVERGENCE_MIN || real(bnew) > RTS_BESSEL_CONVERGENCE_MAX)
-			bnew = 0.0;
+			bnew = 0;
  
 	//shift and add the new value to the array
 	b[0] = b[1];
@@ -130,8 +130,8 @@ CUDA_CALLABLE void shift_sbessely(int n, T x, T* b)//, T stability = 1.4)
 	if(bnew < RTS_BESSEL_MAXIMUM_FLOAT ||
 	   (n > x && bnew > 0))
 	{
-		bnew = (T)0;
-		b[1] = (T)0;
+		bnew = 0;
+		b[1] = 0;
 	}
  
  
-#ifndef RTS_VECTOR_H
-#define RTS_VECTOR_H
-
-#include <iostream>
-#include <cmath>
-#include <sstream>
-//#include "rts/point.h"
-#include "rts/cuda/callable.h"
-
-namespace rts
-{
-
-
-
-template <class T, int N>
-struct vector
-{
-	T v[N];
-
-	CUDA_CALLABLE vector()
-	{
-		//memset(v, 0, sizeof(T) * N);
-		for(int i=0; i<N; i++)
-			v[i] = 0;
-	}
-
-	//efficiency constructor, makes construction easier for 1D-4D vectors
-	CUDA_CALLABLE vector(T x, T y = (T)0.0, T z = (T)0.0, T w = (T)0.0)
-	{
-		if(N >= 1)
-			v[0] = x;
-		if(N >= 2)
-			v[1] = y;
-		if(N >= 3)
-			v[2] = z;
-		if(N >= 4)
-			v[3] = w;
-	}
-
-	CUDA_CALLABLE vector(const T(&data)[N])
-	{
-		memcpy(v, data, sizeof(T) * N);
-	}
-
-	CUDA_CALLABLE T len()
-	{
-        //compute and return the vector length
-        T sum_sq = (T)0;
-        for(int i=0; i<N; i++)
-        {
-            sum_sq += v[i] * v[i];
-        }
-        return std::sqrt(sum_sq);
-
-	}
-
-	CUDA_CALLABLE vector<T, N> cart2sph()
-	{
-		//convert the vector from cartesian to spherical coordinates
-		//x, y, z -> r, theta, phi (where theta = 0 to 2*pi)
-
-		vector<T, N> sph;
-		sph[0] = std::sqrt(v[0]*v[0] + v[1]*v[1] + v[2]*v[2]);
-		sph[1] = std::atan2(v[1], v[0]);
-		sph[2] = std::acos(v[2] / sph[0]);
-
-		return sph;
-	}
-
-	CUDA_CALLABLE vector<T, N> sph2cart()
-	{
-		//convert the vector from cartesian to spherical coordinates
-		//r, theta, phi -> x, y, z (where theta = 0 to 2*pi)
-
-		vector<T, N> cart;
-		cart[0] = v[0] * std::cos(v[1]) * std::sin(v[2]);
-		cart[1] = v[0] * std::sin(v[1]) * std::sin(v[2]);
-		cart[2] = v[0] * std::cos(v[2]);
-
-		return cart;
-	}
-
-	CUDA_CALLABLE vector<T, N> norm()
-	{
-        //compute and return the vector norm
-        vector<T, N> result;
-
-        //compute the vector length
-        T l = len();
-
-        //normalize
-        for(int i=0; i<N; i++)
-        {
-            result.v[i] = v[i] / l;
-        }
-
-        return result;
-	}
-
-	CUDA_CALLABLE vector<T, 3> cross(vector<T, 3> rhs)
-	{
-		vector<T, 3> result;
-
-		//compute the cross product (only valid for 3D vectors)
-		result[0] = v[1] * rhs[2] - v[2] * rhs[1];
-		result[1] = v[2] * rhs[0] - v[0] * rhs[2];
-		result[2] = v[0] * rhs[1] - v[1] * rhs[0];
-
-		return result;
-	}
-
-    CUDA_CALLABLE T dot(vector<T, N> rhs)
-    {
-        T result = (T)0;
-
-        for(int i=0; i<N; i++)
-            result += v[i] * rhs.v[i];
-
-        return result;
-
-    }
-
-	//arithmetic
-	CUDA_CALLABLE vector<T, N> operator+(vector<T, N> rhs)
-	{
-        vector<T, N> result;
-
-        for(int i=0; i<N; i++)
-            result.v[i] = v[i] + rhs.v[i];
-
-        return result;
-	}
-	CUDA_CALLABLE vector<T, N> operator-(vector<T, N> rhs)
-	{
-        vector<T, N> result;
-
-        for(int i=0; i<N; i++)
-            result.v[i] = v[i] - rhs.v[i];
-
-        return result;
-	}
-	CUDA_CALLABLE vector<T, N> operator*(T rhs)
-	{
-        vector<T, N> result;
-
-        for(int i=0; i<N; i++)
-            result.v[i] = v[i] * rhs;
-
-        return result;
-	}
-	CUDA_CALLABLE vector<T, N> operator/(T rhs)
-	{
-        vector<T, N> result;
-
-        for(int i=0; i<N; i++)
-            result.v[i] = v[i] / rhs;
-
-        return result;
-	}
-
-	CUDA_CALLABLE bool operator==(vector<T, N> rhs)
-	{
-        if ( (rhs.v[0] == v[0]) && (rhs.v[1] == v[1]) && (rhs.v[2] == v[2]) )
-            return true;
-
-        return false;
-	}
-
-	std::string toStr()
-	{
-		std::stringstream ss;
-
-		ss<<"[";
-		for(int i=0; i<N; i++)
-		{
-			ss<<v[i];
-			if(i != N-1)
-				ss<<", ";
-		}
-		ss<<"]";
-
-		return ss.str();
-	}
-
-	//bracket operator
-	CUDA_CALLABLE T& operator[](int i)
-	{
-        return v[i];
-    }
-
-};
-
-
-}	//end namespace rts
-
-template <typename T, int N>
-std::ostream& operator<<(std::ostream& os, rts::vector<T, N> v)
-{
-    os<<v.toStr();
-    return os;
-}
-
-//arithmetic operators
-template <typename T, int N>
-CUDA_CALLABLE rts::vector<T, N> operator-(rts::vector<T, N> v)
-{
-    rts::vector<T, N> r;
-
-    //negate the vector
-    for(int i=0; i<N; i++)
-        r.v[i] = -v.v[i];
-
-    return r;
-}
-
-template <typename T, int N>
-CUDA_CALLABLE rts::vector<T, N> operator*(T lhs, rts::vector<T, N> rhs)
-{
-    rts::vector<T, N> r;
-
-    return rhs * lhs;
-}
-
-#if __GNUC__ > 3 && __GNUC_MINOR__ > 7
-template<class T, int N> using rtsVector = rts::vector<T, N>;
-#endif
-
-#endif