kernel.hpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307
  1. /**
  2. * \file kernel.hpp
  3. * \author Dhairya Malhotra, dhairya.malhotra@gmail.com
  4. * \date 12-20-2011
  5. * \brief This file contains the definition of the struct Kernel and also the
  6. * implementation of various kernels for FMM.
  7. */
  8. #include <string>
  9. #include <cstdlib>
  10. #include <pvfmm_common.hpp>
  11. #include <mem_mgr.hpp>
  12. #include <vector.hpp>
  13. #include <matrix.hpp>
  14. #ifndef _PVFMM_FMM_KERNEL_HPP_
  15. #define _PVFMM_FMM_KERNEL_HPP_
  16. namespace pvfmm{
  17. template <class T>
  18. struct Kernel{
  19. public:
  20. /**
  21. * \brief Evaluate potential due to source points at target coordinates.
  22. * \param[in] r_src Coordinates of source points.
  23. * \param[in] src_cnt Number of source points.
  24. * \param[in] v_src Strength of source points.
  25. * \param[in] r_trg Coordinates of target points.
  26. * \param[in] trg_cnt Number of target points.
  27. * \param[out] k_out Output array with potential values.
  28. */
  29. typedef void (*Ker_t)(T* r_src, int src_cnt, T* v_src, int dof,
  30. T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  31. /**
  32. * \brief Constructor.
  33. */
  34. Kernel(Ker_t poten, Ker_t dbl_poten, const char* name, int dim_, std::pair<int,int> k_dim,
  35. size_t dev_poten=(size_t)NULL, size_t dev_dbl_poten=(size_t)NULL);
  36. /**
  37. * \brief Initialize the kernel.
  38. */
  39. void Initialize(bool verbose=false) const;
  40. /**
  41. * \brief Compute the transformation matrix (on the source strength vector)
  42. * to get potential at target coordinates due to sources at the given
  43. * coordinates.
  44. * \param[in] r_src Coordinates of source points.
  45. * \param[in] src_cnt Number of source points.
  46. * \param[in] r_trg Coordinates of target points.
  47. * \param[in] trg_cnt Number of target points.
  48. * \param[out] k_out Output array with potential values.
  49. */
  50. void BuildMatrix(T* r_src, int src_cnt,
  51. T* r_trg, int trg_cnt, T* k_out) const;
  52. int dim;
  53. int ker_dim[2];
  54. std::string ker_name;
  55. Ker_t ker_poten;
  56. Ker_t dbl_layer_poten;
  57. size_t dev_ker_poten;
  58. size_t dev_dbl_layer_poten;
  59. mutable bool init;
  60. mutable bool homogen;
  61. mutable Vector<T> src_scal;
  62. mutable Vector<T> trg_scal;
  63. mutable Vector<Permutation<T> > perm_vec;
  64. mutable const Kernel<T>* k_s2m;
  65. mutable const Kernel<T>* k_s2l;
  66. mutable const Kernel<T>* k_s2t;
  67. mutable const Kernel<T>* k_m2m;
  68. mutable const Kernel<T>* k_m2l;
  69. mutable const Kernel<T>* k_m2t;
  70. mutable const Kernel<T>* k_l2l;
  71. mutable const Kernel<T>* k_l2t;
  72. private:
  73. Kernel();
  74. };
  75. template<typename T, void (*A)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr),
  76. void (*B)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr)>
  77. Kernel<T> BuildKernel(const char* name, int dim, std::pair<int,int> k_dim,
  78. const Kernel<T>* k_s2m=NULL, const Kernel<T>* k_s2l=NULL, const Kernel<T>* k_s2t=NULL,
  79. const Kernel<T>* k_m2m=NULL, const Kernel<T>* k_m2l=NULL, const Kernel<T>* k_m2t=NULL,
  80. const Kernel<T>* k_l2l=NULL, const Kernel<T>* k_l2t=NULL){
  81. size_t dev_ker_poten ;
  82. size_t dev_dbl_layer_poten;
  83. #ifdef __INTEL_OFFLOAD
  84. #pragma offload target(mic:0)
  85. #endif
  86. {
  87. dev_ker_poten =(size_t)((typename Kernel<T>::Ker_t)A);
  88. dev_dbl_layer_poten=(size_t)((typename Kernel<T>::Ker_t)B);
  89. }
  90. Kernel<T> K(A, B, name, dim, k_dim,
  91. dev_ker_poten, dev_dbl_layer_poten);
  92. K.k_s2m=k_s2m;
  93. K.k_s2l=k_s2l;
  94. K.k_s2t=k_s2t;
  95. K.k_m2m=k_m2m;
  96. K.k_m2l=k_m2l;
  97. K.k_m2t=k_m2t;
  98. K.k_l2l=k_l2l;
  99. K.k_l2t=k_l2t;
  100. return K;
  101. }
  102. template<typename T, void (*A)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr)>
  103. Kernel<T> BuildKernel(const char* name, int dim, std::pair<int,int> k_dim,
  104. const Kernel<T>* k_s2m=NULL, const Kernel<T>* k_s2l=NULL, const Kernel<T>* k_s2t=NULL,
  105. const Kernel<T>* k_m2m=NULL, const Kernel<T>* k_m2l=NULL, const Kernel<T>* k_m2t=NULL,
  106. const Kernel<T>* k_l2l=NULL, const Kernel<T>* k_l2t=NULL){
  107. size_t dev_ker_poten ;
  108. #ifdef __INTEL_OFFLOAD
  109. #pragma offload target(mic:0)
  110. #endif
  111. {
  112. dev_ker_poten =(size_t)((typename Kernel<T>::Ker_t)A);
  113. }
  114. Kernel<T> K(A, NULL, name, dim, k_dim,
  115. dev_ker_poten, (size_t)NULL);
  116. K.k_s2m=k_s2m;
  117. K.k_s2l=k_s2l;
  118. K.k_s2t=k_s2t;
  119. K.k_m2m=k_m2m;
  120. K.k_m2l=k_m2l;
  121. K.k_m2t=k_m2t;
  122. K.k_l2l=k_l2l;
  123. K.k_l2t=k_l2t;
  124. return K;
  125. }
  126. }//end namespace
  127. #ifdef __INTEL_OFFLOAD
  128. #pragma offload_attribute(push,target(mic))
  129. #endif
  130. namespace pvfmm{ // Predefined Kernel-functions
  131. ////////////////////////////////////////////////////////////////////////////////
  132. //////// LAPLACE KERNEL ////////
  133. ////////////////////////////////////////////////////////////////////////////////
  134. /**
  135. * \brief Green's function for the Poisson's equation. Kernel tensor
  136. * dimension = 1x1.
  137. */
  138. template <class T>
  139. void laplace_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  140. // Laplace double layer potential.
  141. template <class T>
  142. void laplace_dbl_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  143. // Laplace grdient kernel.
  144. template <class T>
  145. void laplace_grad(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  146. #ifndef __MIC__
  147. #ifdef USE_SSE
  148. template <>
  149. void laplace_poten<double>(double* r_src, int src_cnt, double* v_src, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  150. template <>
  151. void laplace_dbl_poten<double>(double* r_src, int src_cnt, double* v_src, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  152. template <>
  153. void laplace_grad<double>(double* r_src, int src_cnt, double* v_src, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  154. #endif
  155. #endif
  156. //#ifdef PVFMM_QUAD_T
  157. //const Kernel<QuadReal_t> laplace_potn_q=BuildKernel<QuadReal_t, laplace_poten, laplace_dbl_poten>("laplace" , 3, std::pair<int,int>(1,1));
  158. //const Kernel<QuadReal_t> laplace_grad_q=BuildKernel<QuadReal_t, laplace_grad >("laplace_grad", 3, std::pair<int,int>(1,3));
  159. //#endif
  160. const Kernel<double > laplace_potn_d=BuildKernel<double , laplace_poten, laplace_dbl_poten>("laplace" , 3, std::pair<int,int>(1,1));
  161. const Kernel<double > laplace_grad_d=BuildKernel<double , laplace_grad >("laplace_grad", 3, std::pair<int,int>(1,3),
  162. &laplace_potn_d, &laplace_potn_d, NULL, &laplace_potn_d, &laplace_potn_d, NULL, &laplace_potn_d, NULL);
  163. const Kernel<float > laplace_potn_f=BuildKernel<float , laplace_poten, laplace_dbl_poten>("laplace" , 3, std::pair<int,int>(1,1));
  164. const Kernel<float > laplace_grad_f=BuildKernel<float , laplace_grad >("laplace_grad", 3, std::pair<int,int>(1,3),
  165. &laplace_potn_f, &laplace_potn_f, NULL, &laplace_potn_f, &laplace_potn_f, NULL, &laplace_potn_f, NULL);
  166. template<class T>
  167. struct LaplaceKernel{
  168. inline static const Kernel<T>& potn_ker();
  169. inline static const Kernel<T>& grad_ker();
  170. };
  171. //#ifdef PVFMM_QUAD_T
  172. //template<> const Kernel<QuadReal_t>& LaplaceKernel<QuadReal_t>::potn_ker(){ return laplace_potn_q; };
  173. //template<> const Kernel<QuadReal_t>& LaplaceKernel<QuadReal_t>::grad_ker(){ return laplace_grad_q; };
  174. //#endif
  175. template<> const Kernel<double>& LaplaceKernel<double>::potn_ker(){ return laplace_potn_d; };
  176. template<> const Kernel<double>& LaplaceKernel<double>::grad_ker(){ return laplace_grad_d; };
  177. template<> const Kernel<float>& LaplaceKernel<float>::potn_ker(){ return laplace_potn_f; };
  178. template<> const Kernel<float>& LaplaceKernel<float>::grad_ker(){ return laplace_grad_f; };
  179. ////////////////////////////////////////////////////////////////////////////////
  180. //////// STOKES KERNEL ////////
  181. ////////////////////////////////////////////////////////////////////////////////
  182. /**
  183. * \brief Green's function for the Stokes's equation. Kernel tensor
  184. * dimension = 3x3.
  185. */
  186. template <class T>
  187. void stokes_vel(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  188. template <class T>
  189. void stokes_sym_dip(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  190. template <class T>
  191. void stokes_press(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  192. template <class T>
  193. void stokes_stress(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  194. template <class T>
  195. void stokes_grad(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  196. #ifndef __MIC__
  197. #ifdef USE_SSE
  198. template <>
  199. void stokes_vel<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  200. template <>
  201. void stokes_press<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  202. template <>
  203. void stokes_stress<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  204. template <>
  205. void stokes_grad<double>(double* r_src, int src_cnt, double* v_src_, int dof, double* r_trg, int trg_cnt, double* k_out, mem::MemoryManager* mem_mgr);
  206. #endif
  207. #endif
  208. const Kernel<double> ker_stokes_vel =BuildKernel<double, stokes_vel, stokes_sym_dip>("stokes_vel" , 3, std::pair<int,int>(3,3));
  209. const Kernel<double> ker_stokes_press =BuildKernel<double, stokes_press >("stokes_press" , 3, std::pair<int,int>(3,1));
  210. const Kernel<double> ker_stokes_stress=BuildKernel<double, stokes_stress >("stokes_stress", 3, std::pair<int,int>(3,9));
  211. const Kernel<double> ker_stokes_grad =BuildKernel<double, stokes_grad >("stokes_grad" , 3, std::pair<int,int>(3,9));
  212. ////////////////////////////////////////////////////////////////////////////////
  213. //////// BIOT-SAVART KERNEL ////////
  214. ////////////////////////////////////////////////////////////////////////////////
  215. template <class T>
  216. void biot_savart(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  217. const Kernel<double> ker_biot_savart=BuildKernel<double, biot_savart>("biot_savart", 3, std::pair<int,int>(3,3));
  218. ////////////////////////////////////////////////////////////////////////////////
  219. //////// HELMHOLTZ KERNEL ////////
  220. ////////////////////////////////////////////////////////////////////////////////
  221. /**
  222. * \brief Green's function for the Helmholtz's equation. Kernel tensor
  223. * dimension = 2x2.
  224. */
  225. template <class T>
  226. void helmholtz_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  227. template <class T>
  228. void helmholtz_grad(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  229. const Kernel<double> ker_helmholtz =BuildKernel<double, helmholtz_poten>("helmholtz" , 3, std::pair<int,int>(2,2));
  230. const Kernel<double> ker_helmholtz_grad=BuildKernel<double, helmholtz_grad >("helmholtz_grad", 3, std::pair<int,int>(2,6));
  231. }//end namespace
  232. #ifdef __INTEL_OFFLOAD
  233. #pragma offload_attribute(pop)
  234. #endif
  235. #include <kernel.txx>
  236. #endif //_PVFMM_FMM_KERNEL_HPP_