//!NEW : added setFace(), domainWallDslashCuda() got an extra argument void DiracDomainWall::Dslash(cudaColorSpinorField &out, const cudaColorSpinorField &in, const QudaParity parity) const { if ( in.Ndim() != 5 || out.Ndim() != 5) errorQuda("Wrong number of dimensions\n"); checkParitySpinor(in, out); checkSpinorAlias(in, out); domainwall::setFace(face1,face2); // FIXME: temporary hack maintain C linkage for dslashCuda domainWallDslashCuda(&out, gauge, &in, parity, dagger, 0, mass, 0, commDim, profile); long long Ls = in.X(4); long long bulk = (Ls-2)*(in.Volume()/Ls); long long wall = 2*in.Volume()/Ls; flops += 1320LL*(long long)in.Volume() + 96LL*bulk + 120LL*wall; }
void DiracDomainWall::Dslash(cudaColorSpinorField &out, const cudaColorSpinorField &in, const QudaParity parity) const { if ( in.Ndim() != 5 || out.Ndim() != 5) errorQuda("Wrong number of dimensions\n"); if (!initDslash) initDslashConstants(gauge, in.Stride()); if (!initDomainWall) initDomainWallConstants(in.X(4)); checkParitySpinor(in, out); checkSpinorAlias(in, out); domainWallDslashCuda(&out, gauge, &in, parity, dagger, 0, mass, 0, tuneDslash); long long Ls = in.X(4); long long bulk = (Ls-2)*(in.Volume()/Ls); long long wall = 2*in.Volume()/Ls; flops += 1320LL*(long long)in.Volume() + 96LL*bulk + 120LL*wall; }
//!NEW : added setFace(), domainWallDslashCuda() got an extra argument void DiracDomainWall::DslashXpay(cudaColorSpinorField &out, const cudaColorSpinorField &in, const QudaParity parity, const cudaColorSpinorField &x, const double &k) const { if ( in.Ndim() != 5 || out.Ndim() != 5) errorQuda("Wrong number of dimensions\n"); checkParitySpinor(in, out); checkSpinorAlias(in, out); initSpinorConstants(in); setFace(face); // FIXME: temporary hack maintain C linkage for dslashCuda domainWallDslashCuda(&out, gauge, &in, parity, dagger, &x, mass, k, commDim); long long Ls = in.X(4); long long bulk = (Ls-2)*(in.Volume()/Ls); long long wall = 2*in.Volume()/Ls; flops += (1320LL+48LL)*(long long)in.Volume() + 96LL*bulk + 120LL*wall; }
void DiracDomainWall::Dslash(ColorSpinorField &out, const ColorSpinorField &in, const QudaParity parity) const { if ( in.Ndim() != 5 || out.Ndim() != 5) errorQuda("Wrong number of dimensions\n"); checkParitySpinor(in, out); checkSpinorAlias(in, out); if (checkLocation(out, in) == QUDA_CUDA_FIELD_LOCATION) { domainWallDslashCuda(&static_cast<cudaColorSpinorField&>(out), *gauge, &static_cast<const cudaColorSpinorField&>(in), parity, dagger, 0, mass, 0, commDim, profile); } else { errorQuda("Not implemented"); } long long Ls = in.X(4); long long bulk = (Ls-2)*(in.Volume()/Ls); long long wall = 2*in.Volume()/Ls; flops += 1320LL*(long long)in.Volume() + 96LL*bulk + 120LL*wall; }