kernel.hpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294
  1. /**
  2. * \file kernel.hpp
  3. * \author Dhairya Malhotra, dhairya.malhotra@gmail.com
  4. * \date 12-20-2011
  5. * \brief This file contains the definition of the struct Kernel and also the
  6. * implementation of various kernels for FMM.
  7. */
  8. #include <string>
  9. #include <cstdlib>
  10. #include <pvfmm_common.hpp>
  11. #include <mem_mgr.hpp>
  12. #include <vector.hpp>
  13. #include <matrix.hpp>
  14. #ifndef _PVFMM_FMM_KERNEL_HPP_
  15. #define _PVFMM_FMM_KERNEL_HPP_
  16. namespace pvfmm{
  17. template <class T>
  18. struct Kernel{
  19. public:
  20. /**
  21. * \brief Evaluate potential due to source points at target coordinates.
  22. * \param[in] r_src Coordinates of source points.
  23. * \param[in] src_cnt Number of source points.
  24. * \param[in] v_src Strength of source points.
  25. * \param[in] r_trg Coordinates of target points.
  26. * \param[in] trg_cnt Number of target points.
  27. * \param[out] k_out Output array with potential values.
  28. */
  29. typedef void (*Ker_t)(T* r_src, int src_cnt, T* v_src, int dof,
  30. T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  31. /**
  32. * \brief Constructor.
  33. */
  34. Kernel(Ker_t poten, Ker_t dbl_poten, const char* name, int dim_, std::pair<int,int> k_dim,
  35. size_t dev_poten=(size_t)NULL, size_t dev_dbl_poten=(size_t)NULL);
  36. /**
  37. * \brief Initialize the kernel.
  38. */
  39. void Initialize(bool verbose=false) const;
  40. /**
  41. * \brief Compute the transformation matrix (on the source strength vector)
  42. * to get potential at target coordinates due to sources at the given
  43. * coordinates.
  44. * \param[in] r_src Coordinates of source points.
  45. * \param[in] src_cnt Number of source points.
  46. * \param[in] r_trg Coordinates of target points.
  47. * \param[in] trg_cnt Number of target points.
  48. * \param[out] k_out Output array with potential values.
  49. */
  50. void BuildMatrix(T* r_src, int src_cnt,
  51. T* r_trg, int trg_cnt, T* k_out) const;
  52. int dim;
  53. int ker_dim[2];
  54. std::string ker_name;
  55. Ker_t ker_poten;
  56. Ker_t dbl_layer_poten;
  57. size_t dev_ker_poten;
  58. size_t dev_dbl_layer_poten;
  59. mutable bool init;
  60. mutable bool scale_invar;
  61. mutable Vector<T> src_scal;
  62. mutable Vector<T> trg_scal;
  63. mutable Vector<Permutation<T> > perm_vec;
  64. mutable const Kernel<T>* k_s2m;
  65. mutable const Kernel<T>* k_s2l;
  66. mutable const Kernel<T>* k_s2t;
  67. mutable const Kernel<T>* k_m2m;
  68. mutable const Kernel<T>* k_m2l;
  69. mutable const Kernel<T>* k_m2t;
  70. mutable const Kernel<T>* k_l2l;
  71. mutable const Kernel<T>* k_l2t;
  72. private:
  73. Kernel();
  74. };
  75. template<typename T, void (*A)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr),
  76. void (*B)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr)>
  77. Kernel<T> BuildKernel(const char* name, int dim, std::pair<int,int> k_dim,
  78. const Kernel<T>* k_s2m=NULL, const Kernel<T>* k_s2l=NULL, const Kernel<T>* k_s2t=NULL,
  79. const Kernel<T>* k_m2m=NULL, const Kernel<T>* k_m2l=NULL, const Kernel<T>* k_m2t=NULL,
  80. const Kernel<T>* k_l2l=NULL, const Kernel<T>* k_l2t=NULL){
  81. size_t dev_ker_poten ;
  82. size_t dev_dbl_layer_poten;
  83. #ifdef __INTEL_OFFLOAD
  84. #pragma offload target(mic:0)
  85. #endif
  86. {
  87. dev_ker_poten =(size_t)((typename Kernel<T>::Ker_t)A);
  88. dev_dbl_layer_poten=(size_t)((typename Kernel<T>::Ker_t)B);
  89. }
  90. Kernel<T> K(A, B, name, dim, k_dim,
  91. dev_ker_poten, dev_dbl_layer_poten);
  92. K.k_s2m=k_s2m;
  93. K.k_s2l=k_s2l;
  94. K.k_s2t=k_s2t;
  95. K.k_m2m=k_m2m;
  96. K.k_m2l=k_m2l;
  97. K.k_m2t=k_m2t;
  98. K.k_l2l=k_l2l;
  99. K.k_l2t=k_l2t;
  100. return K;
  101. }
  102. template<typename T, void (*A)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr)>
  103. Kernel<T> BuildKernel(const char* name, int dim, std::pair<int,int> k_dim,
  104. const Kernel<T>* k_s2m=NULL, const Kernel<T>* k_s2l=NULL, const Kernel<T>* k_s2t=NULL,
  105. const Kernel<T>* k_m2m=NULL, const Kernel<T>* k_m2l=NULL, const Kernel<T>* k_m2t=NULL,
  106. const Kernel<T>* k_l2l=NULL, const Kernel<T>* k_l2t=NULL){
  107. size_t dev_ker_poten ;
  108. #ifdef __INTEL_OFFLOAD
  109. #pragma offload target(mic:0)
  110. #endif
  111. {
  112. dev_ker_poten =(size_t)((typename Kernel<T>::Ker_t)A);
  113. }
  114. Kernel<T> K(A, NULL, name, dim, k_dim,
  115. dev_ker_poten, (size_t)NULL);
  116. K.k_s2m=k_s2m;
  117. K.k_s2l=k_s2l;
  118. K.k_s2t=k_s2t;
  119. K.k_m2m=k_m2m;
  120. K.k_m2l=k_m2l;
  121. K.k_m2t=k_m2t;
  122. K.k_l2l=k_l2l;
  123. K.k_l2t=k_l2t;
  124. return K;
  125. }
  126. }//end namespace
  127. #ifdef __INTEL_OFFLOAD
  128. #pragma offload_attribute(push,target(mic))
  129. #endif
  130. namespace pvfmm{ // Predefined Kernel-functions
  131. ////////////////////////////////////////////////////////////////////////////////
  132. //////// LAPLACE KERNEL ////////
  133. ////////////////////////////////////////////////////////////////////////////////
  134. /**
  135. * \brief Green's function for the Poisson's equation. Kernel tensor
  136. * dimension = 1x1.
  137. */
  138. template <class T, int newton_iter=0>
  139. void laplace_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  140. // Laplace double layer potential.
  141. template <class T, int newton_iter=0>
  142. void laplace_dbl_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  143. // Laplace grdient kernel.
  144. template <class T, int newton_iter=0>
  145. void laplace_grad(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  146. //#ifdef PVFMM_QUAD_T
  147. //const Kernel<QuadReal_t> laplace_potn_q=BuildKernel<QuadReal_t, laplace_poten, laplace_dbl_poten>("laplace" , 3, std::pair<int,int>(1,1));
  148. //const Kernel<QuadReal_t> laplace_grad_q=BuildKernel<QuadReal_t, laplace_grad >("laplace_grad", 3, std::pair<int,int>(1,3));
  149. //#endif
  150. const Kernel<double > laplace_potn_d=BuildKernel<double , laplace_poten<double,2>, laplace_dbl_poten<double,2> >("laplace" , 3, std::pair<int,int>(1,1));
  151. const Kernel<double > laplace_grad_d=BuildKernel<double , laplace_grad <double,2> >("laplace_grad", 3, std::pair<int,int>(1,3),
  152. &laplace_potn_d, &laplace_potn_d, NULL, &laplace_potn_d, &laplace_potn_d, NULL, &laplace_potn_d, NULL);
  153. const Kernel<float > laplace_potn_f=BuildKernel<float , laplace_poten<float,1>, laplace_dbl_poten<float,1> >("laplace" , 3, std::pair<int,int>(1,1));
  154. const Kernel<float > laplace_grad_f=BuildKernel<float , laplace_grad <float,1> >("laplace_grad", 3, std::pair<int,int>(1,3),
  155. &laplace_potn_f, &laplace_potn_f, NULL, &laplace_potn_f, &laplace_potn_f, NULL, &laplace_potn_f, NULL);
  156. template<class T>
  157. struct LaplaceKernel{
  158. inline static const Kernel<T>& potn_ker();
  159. inline static const Kernel<T>& grad_ker();
  160. };
  161. //#ifdef PVFMM_QUAD_T
  162. //template<> const Kernel<QuadReal_t>& LaplaceKernel<QuadReal_t>::potn_ker(){ return laplace_potn_q; };
  163. //template<> const Kernel<QuadReal_t>& LaplaceKernel<QuadReal_t>::grad_ker(){ return laplace_grad_q; };
  164. //#endif
  165. template<> const Kernel<double>& LaplaceKernel<double>::potn_ker(){ return laplace_potn_d; };
  166. template<> const Kernel<double>& LaplaceKernel<double>::grad_ker(){ return laplace_grad_d; };
  167. template<> const Kernel<float>& LaplaceKernel<float>::potn_ker(){ return laplace_potn_f; };
  168. template<> const Kernel<float>& LaplaceKernel<float>::grad_ker(){ return laplace_grad_f; };
  169. ////////////////////////////////////////////////////////////////////////////////
  170. //////// STOKES KERNEL ////////
  171. ////////////////////////////////////////////////////////////////////////////////
  172. /**
  173. * \brief Green's function for the Stokes's equation. Kernel tensor
  174. * dimension = 3x3.
  175. */
  176. template <class T>
  177. void stokes_vel(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  178. template <class T>
  179. void stokes_sym_dip(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  180. template <class T>
  181. void stokes_press(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  182. template <class T>
  183. void stokes_stress(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  184. template <class T>
  185. void stokes_grad(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  186. #ifndef __MIC__
  187. #ifdef USE_SSE
  188. template <>
  189. void stokes_vel<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  190. template <>
  191. void stokes_press<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  192. template <>
  193. void stokes_stress<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  194. template <>
  195. void stokes_grad<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  196. #endif
  197. #endif
  198. const Kernel<double> ker_stokes_vel =BuildKernel<double, stokes_vel, stokes_sym_dip>("stokes_vel" , 3, std::pair<int,int>(3,3));
  199. const Kernel<double> ker_stokes_press =BuildKernel<double, stokes_press >("stokes_press" , 3, std::pair<int,int>(3,1));
  200. const Kernel<double> ker_stokes_stress=BuildKernel<double, stokes_stress >("stokes_stress", 3, std::pair<int,int>(3,9));
  201. const Kernel<double> ker_stokes_grad =BuildKernel<double, stokes_grad >("stokes_grad" , 3, std::pair<int,int>(3,9));
  202. ////////////////////////////////////////////////////////////////////////////////
  203. //////// BIOT-SAVART KERNEL ////////
  204. ////////////////////////////////////////////////////////////////////////////////
  205. template <class T>
  206. void biot_savart(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  207. const Kernel<double> ker_biot_savart=BuildKernel<double, biot_savart>("biot_savart", 3, std::pair<int,int>(3,3));
  208. ////////////////////////////////////////////////////////////////////////////////
  209. //////// HELMHOLTZ KERNEL ////////
  210. ////////////////////////////////////////////////////////////////////////////////
  211. /**
  212. * \brief Green's function for the Helmholtz's equation. Kernel tensor
  213. * dimension = 2x2.
  214. */
  215. template <class T>
  216. void helmholtz_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  217. template <class T>
  218. void helmholtz_grad(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  219. const Kernel<double> ker_helmholtz =BuildKernel<double, helmholtz_poten>("helmholtz" , 3, std::pair<int,int>(2,2));
  220. const Kernel<double> ker_helmholtz_grad=BuildKernel<double, helmholtz_grad >("helmholtz_grad", 3, std::pair<int,int>(2,6));
  221. }//end namespace
  222. #ifdef __INTEL_OFFLOAD
  223. #pragma offload_attribute(pop)
  224. #endif
  225. #include <kernel.txx>
  226. #endif //_PVFMM_FMM_KERNEL_HPP_