kernel.hpp 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244
  1. /**
  2. * \file kernel.hpp
  3. * \author Dhairya Malhotra, dhairya.malhotra@gmail.com
  4. * \date 12-20-2011
  5. * \brief This file contains the definition of the struct Kernel and also the
  6. * implementation of various kernels for FMM.
  7. */
  8. #ifndef _PVFMM_FMM_KERNEL_HPP_
  9. #define _PVFMM_FMM_KERNEL_HPP_
  10. #include <pvfmm_common.hpp>
  11. #include <quad_utils.hpp>
  12. #include <mem_mgr.hpp>
  13. #include <string>
  14. namespace pvfmm{
  15. template <class T>
  16. struct Kernel{
  17. public:
  18. /**
  19. * \brief Evaluate potential due to source points at target coordinates.
  20. * \param[in] r_src Coordinates of source points.
  21. * \param[in] src_cnt Number of source points.
  22. * \param[in] v_src Strength of source points.
  23. * \param[in] r_trg Coordinates of target points.
  24. * \param[in] trg_cnt Number of target points.
  25. * \param[out] k_out Output array with potential values.
  26. */
  27. typedef void (*Ker_t)(T* r_src, int src_cnt, T* v_src, int dof,
  28. T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  29. /**
  30. * \brief Constructor.
  31. */
  32. Kernel();
  33. /**
  34. * \brief Constructor.
  35. */
  36. Kernel(Ker_t poten, Ker_t dbl_poten, const char* name, int dim_,
  37. const int (&k_dim)[2], bool homogen_=false, T ker_scale=0,
  38. size_t dev_poten=(size_t)NULL, size_t dev_dbl_poten=(size_t)NULL);
  39. /**
  40. * \brief Compute the transformation matrix (on the source strength vector)
  41. * to get potential at target coordinates due to sources at the given
  42. * coordinates.
  43. * \param[in] r_src Coordinates of source points.
  44. * \param[in] src_cnt Number of source points.
  45. * \param[in] r_trg Coordinates of target points.
  46. * \param[in] trg_cnt Number of target points.
  47. * \param[out] k_out Output array with potential values.
  48. */
  49. void BuildMatrix(T* r_src, int src_cnt,
  50. T* r_trg, int trg_cnt, T* k_out);
  51. int dim;
  52. int ker_dim[2];
  53. Ker_t ker_poten;
  54. Ker_t dbl_layer_poten;
  55. size_t dev_ker_poten;
  56. size_t dev_dbl_layer_poten;
  57. bool homogen;
  58. T poten_scale;
  59. std::string ker_name;
  60. };
  61. template<typename T, void (*A)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr),
  62. void (*B)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr)>
  63. Kernel<T> BuildKernel(const char* name, int dim,
  64. const int (&k_dim)[2], bool homogen=false, T ker_scale=0){
  65. size_t dev_ker_poten ;
  66. size_t dev_dbl_layer_poten;
  67. #ifdef __INTEL_OFFLOAD
  68. #pragma offload target(mic:0)
  69. #endif
  70. {
  71. dev_ker_poten =(size_t)((typename Kernel<T>::Ker_t)A);
  72. dev_dbl_layer_poten=(size_t)((typename Kernel<T>::Ker_t)B);
  73. }
  74. return Kernel<T>(A, B,
  75. name, dim, k_dim, homogen, ker_scale,
  76. dev_ker_poten, dev_dbl_layer_poten);
  77. }
  78. template<typename T, void (*A)(T*, int, T*, int, T*, int, T*, mem::MemoryManager* mem_mgr)>
  79. Kernel<T> BuildKernel(const char* name, int dim,
  80. const int (&k_dim)[2], bool homogen=false, T ker_scale=0){
  81. size_t dev_ker_poten ;
  82. #ifdef __INTEL_OFFLOAD
  83. #pragma offload target(mic:0)
  84. #endif
  85. {
  86. dev_ker_poten =(size_t)((typename Kernel<T>::Ker_t)A);
  87. }
  88. return Kernel<T>(A, NULL,
  89. name, dim, k_dim, homogen, ker_scale,
  90. dev_ker_poten, (size_t)NULL);
  91. }
  92. }//end namespace
  93. #ifdef __INTEL_OFFLOAD
  94. #pragma offload_attribute(push,target(mic))
  95. #endif
  96. namespace pvfmm{ // Predefined Kernel-functions
  97. ////////////////////////////////////////////////////////////////////////////////
  98. //////// LAPLACE KERNEL ////////
  99. ////////////////////////////////////////////////////////////////////////////////
  100. /**
  101. * \brief Green's function for the Poisson's equation. Kernel tensor
  102. * dimension = 1x1.
  103. */
  104. template <class T>
  105. void laplace_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  106. // Laplace double layer potential.
  107. template <class T>
  108. void laplace_dbl_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  109. // Laplace grdient kernel.
  110. template <class T>
  111. void laplace_grad(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  112. int dim_laplace_poten[2]={1,1};
  113. int dim_laplace_grad [2]={1,3};
  114. #ifdef QuadReal_t
  115. const Kernel<QuadReal_t> laplace_potn_q=BuildKernel<QuadReal_t, laplace_poten, laplace_dbl_poten>("laplace" , 3, dim_laplace_poten, true, 1.0);
  116. const Kernel<QuadReal_t> laplace_grad_q=BuildKernel<QuadReal_t, laplace_grad >("laplace_grad", 3, dim_laplace_grad , true, 2.0);
  117. #endif
  118. const Kernel<double > laplace_potn_d=BuildKernel<double , laplace_poten, laplace_dbl_poten>("laplace" , 3, dim_laplace_poten, true, 1.0);
  119. const Kernel<double > laplace_grad_d=BuildKernel<double , laplace_grad >("laplace_grad", 3, dim_laplace_grad , true, 2.0);
  120. const Kernel<float > laplace_potn_f=BuildKernel<float , laplace_poten, laplace_dbl_poten>("laplace" , 3, dim_laplace_poten, true, 1.0);
  121. const Kernel<float > laplace_grad_f=BuildKernel<float , laplace_grad >("laplace_grad", 3, dim_laplace_grad , true, 2.0);
  122. template<class T>
  123. struct LaplaceKernel{
  124. static Kernel<T>* potn_ker;
  125. static Kernel<T>* grad_ker;
  126. };
  127. #ifdef QuadReal_t
  128. template<> Kernel<QuadReal_t>* LaplaceKernel<QuadReal_t>::potn_ker=(Kernel<QuadReal_t>*)&laplace_potn_q;
  129. template<> Kernel<QuadReal_t>* LaplaceKernel<QuadReal_t>::grad_ker=(Kernel<QuadReal_t>*)&laplace_grad_q;
  130. #endif
  131. template<> Kernel<double>* LaplaceKernel<double>::potn_ker=(Kernel<double>*)&laplace_potn_d;
  132. template<> Kernel<double>* LaplaceKernel<double>::grad_ker=(Kernel<double>*)&laplace_grad_d;
  133. template<> Kernel<float>* LaplaceKernel<float>::potn_ker=(Kernel<float>*)&laplace_potn_f;
  134. template<> Kernel<float>* LaplaceKernel<float>::grad_ker=(Kernel<float>*)&laplace_grad_f;
  135. ////////////////////////////////////////////////////////////////////////////////
  136. //////// STOKES KERNEL ////////
  137. ////////////////////////////////////////////////////////////////////////////////
  138. /**
  139. * \brief Green's function for the Stokes's equation. Kernel tensor
  140. * dimension = 3x3.
  141. */
  142. template <class T>
  143. void stokes_vel(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  144. template <class T>
  145. void stokes_sym_dip(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  146. template <class T>
  147. void stokes_press(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  148. template <class T>
  149. void stokes_stress(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  150. template <class T>
  151. void stokes_grad(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  152. int dim_stokes_vel [2]={3,3};
  153. const Kernel<double> ker_stokes_vel =BuildKernel<double, stokes_vel, stokes_sym_dip>("stokes_vel" , 3, dim_stokes_vel ,true,1.0);
  154. int dim_stokes_press [2]={3,1};
  155. const Kernel<double> ker_stokes_press =BuildKernel<double, stokes_press >("stokes_press" , 3, dim_stokes_press ,true,2.0);
  156. int dim_stokes_stress[2]={3,9};
  157. const Kernel<double> ker_stokes_stress=BuildKernel<double, stokes_stress >("stokes_stress", 3, dim_stokes_stress,true,2.0);
  158. int dim_stokes_grad [2]={3,9};
  159. const Kernel<double> ker_stokes_grad =BuildKernel<double, stokes_grad >("stokes_grad" , 3, dim_stokes_grad ,true,2.0);
  160. ////////////////////////////////////////////////////////////////////////////////
  161. //////// BIOT-SAVART KERNEL ////////
  162. ////////////////////////////////////////////////////////////////////////////////
  163. template <class T>
  164. void biot_savart(T* r_src, int src_cnt, T* v_src_, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  165. int dim_biot_savart[2]={3,3};
  166. const Kernel<double> ker_biot_savart=BuildKernel<double, biot_savart>("biot_savart", 3, dim_biot_savart,true,2.0);
  167. ////////////////////////////////////////////////////////////////////////////////
  168. //////// HELMHOLTZ KERNEL ////////
  169. ////////////////////////////////////////////////////////////////////////////////
  170. /**
  171. * \brief Green's function for the Helmholtz's equation. Kernel tensor
  172. * dimension = 2x2.
  173. */
  174. template <class T>
  175. void helmholtz_poten(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  176. template <class T>
  177. void helmholtz_grad(T* r_src, int src_cnt, T* v_src, int dof, T* r_trg, int trg_cnt, T* k_out, mem::MemoryManager* mem_mgr);
  178. int dim_helmholtz [2]={2,2};
  179. const Kernel<double> ker_helmholtz =BuildKernel<double, helmholtz_poten>("helmholtz" , 3, dim_helmholtz );
  180. int dim_helmholtz_grad[2]={2,6};
  181. const Kernel<double> ker_helmholtz_grad=BuildKernel<double, helmholtz_grad >("helmholtz_grad", 3, dim_helmholtz_grad);
  182. }//end namespace
  183. #ifdef __INTEL_OFFLOAD
  184. #pragma offload_attribute(pop)
  185. #endif
  186. #include <kernel.txx>
  187. #endif //_PVFMM_FMM_KERNEL_HPP_