/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid Source file: ./lib/qcd/action/fermion/WilsonKernelsAsmAvx512.h Copyright (C) 2015 Author: Peter Boyle Author: paboyle This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ /* END LEGAL */ #pragma once #if defined(AVX512) /////////////////////////////////////////////////////////// // If we are AVX512 specialise the single precision routine /////////////////////////////////////////////////////////// #include #include /// Switch off the 5d vectorised code optimisations #undef DWFVEC5D static std::vector signsF; template int setupSigns(std::vector& signs ){ std::vector bother(2); signs = bother; vrsign(signs[0]); visign(signs[1]); return 1; } static int signInitF = setupSigns(signsF); #define MAYBEPERM(A,perm) if (perm) { A ; } #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN(ptr,pf) #define COMPLEX_SIGNS(isigns) vComplexF *isigns = &signsF[0]; ///////////////////////////////////////////////////////////////// // XYZT vectorised, undag Kernel, single ///////////////////////////////////////////////////////////////// #undef KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include ///////////////////////////////////////////////////////////////// // XYZT vectorised, dag Kernel, single ///////////////////////////////////////////////////////////////// #define KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef MAYBEPERM #undef MULT_2SPIN #define MAYBEPERM(A,B) #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN_LS(ptr,pf) ///////////////////////////////////////////////////////////////// // Ls vectorised, undag Kernel, single ///////////////////////////////////////////////////////////////// #ifdef DWFVEC5D #undef KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR #undef MULT_2SPIN #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN_LSNOPF(ptr,pf) template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include // //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include ///////////////////////////////////////////////////////////////// // Ls vectorised, dag Kernel, single ///////////////////////////////////////////////////////////////// #define KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #endif // VEC 5D #undef COMPLEX_SIGNS #undef MAYBEPERM #undef MULT_2SPIN /////////////////////////////////////////////////////////// // If we are AVX512 specialise the double precision routine /////////////////////////////////////////////////////////// #include static std::vector signsD; static int signInitD = setupSigns(signsD); #define MAYBEPERM(A,perm) if (perm) { A ; } #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN(ptr,pf) #define COMPLEX_SIGNS(isigns) vComplexD *isigns = &signsD[0]; #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR ///////////////////////////////////////////////////////////////// // XYZT vectorised, undag Kernel, single ///////////////////////////////////////////////////////////////// #undef KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include ///////////////////////////////////////////////////////////////// // XYZT vectorised, dag Kernel, single ///////////////////////////////////////////////////////////////// #define KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef MAYBEPERM #undef MULT_2SPIN #define MAYBEPERM(A,B) #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN_LS(ptr,pf) ///////////////////////////////////////////////////////////////// // Ls vectorised, undag Kernel, single ///////////////////////////////////////////////////////////////// #ifdef DWFVEC5D #undef KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSite(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteInt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR #undef MULT_2SPIN #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN_LSNOPF(ptr,pf) template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteExt(StencilView &st, DoubledGaugeFieldView &U, SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include ///////////////////////////////////////////////////////////////// // Ls vectorised, dag Kernel, single ///////////////////////////////////////////////////////////////// #define KERNEL_DAG #define INTERIOR_AND_EXTERIOR #undef INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDag(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #define INTERIOR #undef EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDagInt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #undef INTERIOR_AND_EXTERIOR #undef INTERIOR #define EXTERIOR template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include template<> void WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) #include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include //template<> void //WilsonKernels::AsmDhopSiteDagExt(StencilView &st, DoubledGaugeFieldView &U,SiteHalfSpinor *buf, // int ss,int ssU,int Ls,int Ns,const FermionFieldView &in, FermionFieldView &out) //#include #endif // VEC 5D #undef COMPLEX_SIGNS #undef MAYBEPERM #undef MULT_2SPIN #undef Chi_00 #undef Chi_01 #undef Chi_02 #undef Chi_10 #undef Chi_11 #undef Chi_12 #undef Chi_20 #undef Chi_21 #undef Chi_22 #undef Chi_30 #undef Chi_31 #undef Chi_32 #undef UChi_00 #undef UChi_01 #undef UChi_02 #undef UChi_10 #undef UChi_11 #undef UChi_12 #undef UChi_20 #undef UChi_21 #undef UChi_22 #undef UChi_30 #undef UChi_31 #undef UChi_32 #undef Psi_00 #undef Psi_01 #undef Psi_02 #undef Psi_10 #undef Psi_11 #undef Psi_12 #undef Psi_20 #undef Psi_21 #undef Psi_22 #undef Psi_30 #undef Psi_31 #undef Psi_32 #undef Phi_00 #undef Phi_01 #undef Phi_02 #undef Phi_10 #undef Phi_11 #undef Phi_12 #undef Phi_20 #undef Phi_21 #undef Phi_22 #undef Phi_30 #undef Phi_31 #undef Phi_32 #endif //AVX512