Created
August 17, 2018 14:59
-
-
Save iAbadia/529950f511e92a0d93ab6926fe2034be to your computer and use it in GitHub Desktop.
Benchmark_ITT gprof output.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Flat profile: | |
Each sample counts as 0.01 seconds. | |
% cumulative self self total | |
time seconds seconds calls s/call s/call name | |
25.03 722.12 722.12 473465689 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) | |
11.38 1050.49 328.37 32487566 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
10.33 1348.49 298.00 28067609 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
10.01 1637.34 288.85 33607682 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
9.71 1917.63 280.29 29677671 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
8.77 2170.77 253.14 30706382 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
8.34 2411.47 240.70 21952384 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
6.89 2610.42 198.95 20202520 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
6.72 2804.30 193.88 19253970 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
1.27 2840.88 36.58 Grid::QCD::DomainWallFermion<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MomentumSpacePropagator(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, double) | |
0.17 2845.88 5.00 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() | |
0.15 2850.32 4.44 36 0.12 0.31 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) | |
0.14 2854.33 4.01 27861504 0.00 0.00 Grid::GridRedBlackCartesian::CheckerBoardFromOindex(int) | |
0.13 2858.17 3.84 Grid::QCD::FermionOperator<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::RedBlackGrid() | |
0.13 2861.92 3.75 88378312 0.00 0.00 Grid::permute(Grid::Grid_simd<std::complex<float>, __Float32x4_t>&, Grid::Grid_simd<std::complex<float>, __Float32x4_t>, int) | |
0.12 2865.52 3.60 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) | |
0.09 2868.12 2.61 32499663 0.00 0.00 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) | |
0.07 2870.01 1.89 778 0.00 0.00 frame_dummy | |
0.06 2871.85 1.84 __multf3 | |
0.06 2873.59 1.74 Grid::QCD::FermionOperator<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooDeriv(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int) | |
0.05 2875.08 1.49 std::enable_if<Grid::matchGridTensorIndex<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4>, 2>::value, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >::type Grid::QCD::operator*<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >(Grid::QCD::Gamma const&, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> const&) | |
0.05 2876.42 1.34 25 0.05 0.05 Grid::GridRNGbase::~GridRNGbase() | |
0.03 2877.40 0.98 32 0.03 0.03 void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) | |
0.03 2878.21 0.81 25 0.03 0.03 std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::discrete_distribution<int>*, std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > > >, unsigned long, std::discrete_distribution<int> const&) | |
0.02 2878.91 0.70 Benchmark::DWF(int, int, double&) | |
0.02 2879.56 0.65 844288 0.00 0.00 void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) | |
0.02 2880.21 0.65 36 0.02 0.02 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::BuildSurfaceList(int, int) | |
0.02 2880.86 0.65 __trunctfdf2 | |
0.02 2881.40 0.54 1560 0.00 0.00 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) | |
0.02 2881.88 0.48 __extenddftf2 | |
0.01 2882.27 0.39 180 0.00 0.00 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::allocate(unsigned long, void const*) | |
0.01 2882.58 0.31 4 0.08 0.11 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) | |
0.01 2882.86 0.28 8 0.04 0.05 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) | |
0.01 2883.13 0.27 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::TwoIndexRep<3, (Grid::QCD::TwoIndexSymmetry)1>, Grid::QCD::CoeffReal> >::ContractConservedCurrentSiteBwd(Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> > const&, Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> > const&, Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6> >, 8> >&, unsigned int, unsigned int, bool) | |
0.01 2883.31 0.18 79152 0.00 0.00 Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) | |
0.00 2883.45 0.14 1497897 0.00 0.00 Grid::GridBase::iIndex(std::vector<int, std::allocator<int> >&) | |
0.00 2883.59 0.14 1535850 0.00 0.00 Grid::GridBase::oIndex(std::vector<int, std::allocator<int> >&) | |
0.00 2883.72 0.13 422144 0.00 0.00 void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) | |
0.00 2883.85 0.13 424 0.00 0.00 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) | |
0.00 2883.98 0.13 25 0.01 0.01 std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::normal_distribution<double>*, std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > > >, unsigned long, std::normal_distribution<double> const&) | |
0.00 2884.10 0.12 36 0.00 0.00 Grid::alignedAllocator<Grid::StencilEntry>::allocate(unsigned long, void const*) | |
0.00 2884.21 0.11 3377152 0.00 0.00 Grid::CartesianCommunicator::ProcessorCoorFromRank(int, std::vector<int, std::allocator<int> >&) | |
0.00 2884.31 0.10 410303 0.00 0.00 Grid::GridRedBlackCartesian::oIndex(std::vector<int, std::allocator<int> >&) | |
0.00 2884.40 0.09 625601 0.00 0.00 Grid::GridRedBlackCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) | |
0.00 2884.49 0.09 296762 0.00 0.00 sitmo::prng_engine::encrypt_counter() | |
0.00 2884.58 0.09 Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const Grid::predicatedWhere<Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const>(Grid::Grid_simd<unsigned int, __Uint32x4_t> const& const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&) | |
0.00 2884.67 0.09 36 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) | |
0.00 2884.74 0.07 4 0.02 0.29 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
0.00 2884.80 0.06 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteDag(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
0.00 2884.86 0.06 __divdc3 | |
0.00 2884.91 0.05 25 0.00 0.00 std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_int_distribution<unsigned int>*, std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > > >, unsigned long, std::uniform_int_distribution<unsigned int> const&) | |
0.00 2884.96 0.05 24 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::allocate(unsigned long, void const*) | |
0.00 2885.01 0.05 Grid::Gather_plane_table_compute(Grid::GridBase*, int, int, int, int, std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >&) | |
0.00 2885.06 0.05 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplex> >::HandDhopSiteDagExt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&) | |
0.00 2885.11 0.05 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::TwoIndexRep<3, (Grid::QCD::TwoIndexSymmetry)-1>, Grid::QCD::CoeffReal> >::DhopDir(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int, int) | |
0.00 2885.15 0.04 33 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::allocate(unsigned long, void const*) | |
0.00 2885.19 0.04 25 0.00 0.00 std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_real_distribution<double>*, std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > > >, unsigned long, std::uniform_real_distribution<double> const&) | |
0.00 2885.23 0.04 16 0.00 0.01 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) | |
0.00 2885.27 0.04 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteDag(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) | |
0.00 2885.30 0.03 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopDir(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int, int) | |
0.00 2885.32 0.02 167755 0.00 0.00 Grid::Grid_simd<unsigned int, __Uint32x4_t> Grid::Comparison<Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t>, 0>(Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::Grid_simd<unsigned int, __Uint32x4_t>::scalar_type const&) | |
0.00 2885.34 0.02 112128 0.00 0.00 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) | |
0.00 2885.36 0.02 12 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::allocate(unsigned long, void const*) | |
0.00 2885.37 0.01 3585944 0.00 0.00 Grid::CartesianCommunicator::ThisRank() | |
0.00 2885.38 0.01 190280 0.00 0.00 Grid::CartesianCommunicator::RankFromProcessorCoor(std::vector<int, std::allocator<int> >&) | |
0.00 2885.39 0.01 19232 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.40 0.01 54 0.00 0.00 std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) | |
0.00 2885.41 0.01 16 0.00 0.00 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int, int) | |
0.00 2885.42 0.01 Grid::CartesianCommunicator::ShiftedRanks(int, int, int&, int&) | |
0.00 2885.43 0.01 Grid::CartesianCommunicator::BossRank() | |
0.00 2885.44 0.01 Benchmark::Memory() | |
0.00 2885.45 0.01 std::vector<std::vector<ompi_request_t*, std::allocator<ompi_request_t*> >, std::allocator<std::vector<ompi_request_t*, std::allocator<ompi_request_t*> > > >::~vector() | |
0.00 2885.45 0.01 24 0.00 0.00 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.01 Grid::GridRedBlackCartesian::~GridRedBlackCartesian() | |
0.00 2885.46 0.01 std::ctype<char>::do_widen(char) const | |
0.00 2885.46 0.00 1266432 0.00 0.00 Grid::GridCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 112128 0.00 0.00 Grid::CartesianCommunicator::StencilBarrier() | |
0.00 2885.46 0.00 56064 0.00 0.00 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void>&, int, int&) | |
0.00 2885.46 0.00 56064 0.00 0.00 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Prepare() | |
0.00 2885.46 0.00 38464 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 38432 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 28032 0.00 0.00 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) | |
0.00 2885.46 0.00 28032 0.00 0.00 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) | |
0.00 2885.46 0.00 19232 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 17600 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 17600 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 8800 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 8800 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 3206 0.00 0.00 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) | |
0.00 2885.46 0.00 3024 0.00 0.00 Grid::GridRedBlackCartesian::CheckerBoardShiftForCB(int, int, int, int) | |
0.00 2885.46 0.00 2790 0.00 0.00 Grid::GridCartesian::CheckerBoarded(int) | |
0.00 2885.46 0.00 2640 0.00 0.00 Grid::GridRedBlackCartesian::CheckerBoarded(int) | |
0.00 2885.46 0.00 1325 0.00 0.00 Grid::PointerCache::Insert(void*, unsigned long) | |
0.00 2885.46 0.00 1325 0.00 0.00 Grid::PointerCache::Lookup(unsigned long) | |
0.00 2885.46 0.00 1040 0.00 0.00 Grid::LebesgueOrder::IterateO(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) | |
0.00 2885.46 0.00 824 0.00 0.00 void Grid::Copy_plane<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int) | |
0.00 2885.46 0.00 672 0.00 0.00 Grid::CartesianCommunicator::GlobalSum(double&) | |
0.00 2885.46 0.00 620 0.00 0.00 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) | |
0.00 2885.46 0.00 618 0.00 0.00 void Grid::Copy_plane<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int) | |
0.00 2885.46 0.00 432 0.00 0.00 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >*, unsigned long) | |
0.00 2885.46 0.00 432 0.00 0.00 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::allocate(unsigned long, void const*) | |
0.00 2885.46 0.00 424 0.00 0.00 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) | |
0.00 2885.46 0.00 224 0.00 0.00 Grid::GridCartesian::CheckerBoardDestination(int, int, int) | |
0.00 2885.46 0.00 216 0.00 0.00 Grid::SharedMemory::ShmBufferMalloc(unsigned long) | |
0.00 2885.46 0.00 191 0.00 0.00 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 180 0.00 0.00 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) | |
0.00 2885.46 0.00 144 0.00 0.00 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() | |
0.00 2885.46 0.00 144 0.00 0.00 Grid::CartesianCommunicator::Barrier() | |
0.00 2885.46 0.00 144 0.00 0.00 Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Reporti(int) | |
0.00 2885.46 0.00 127 0.00 0.00 Grid::SharedMemory::ShmBufferFreeAll() | |
0.00 2885.46 0.00 120 0.00 0.00 std::vector<double, std::allocator<double> >::_M_default_append(unsigned long) | |
0.00 2885.46 0.00 120 0.00 0.00 std::vector<double, std::allocator<double> >::resize(unsigned long) | |
0.00 2885.46 0.00 116 0.00 0.00 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) | |
0.00 2885.46 0.00 104 0.00 0.00 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::~Lattice() | |
0.00 2885.46 0.00 92 0.00 0.00 std::vector<void*, std::allocator<void*> >::_M_default_append(unsigned long) | |
0.00 2885.46 0.00 91 0.00 0.00 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) | |
0.00 2885.46 0.00 76 0.00 0.00 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) | |
0.00 2885.46 0.00 76 0.00 0.00 Grid::alignedAllocator<std::complex<double> >::deallocate(std::complex<double>*, unsigned long) | |
0.00 2885.46 0.00 76 0.00 0.00 Grid::alignedAllocator<std::complex<double> >::allocate(unsigned long, void const*) | |
0.00 2885.46 0.00 76 0.00 0.00 Grid::CartesianCommunicator::GlobalSumVector(double*, int) | |
0.00 2885.46 0.00 76 0.00 0.00 Grid::CartesianCommunicator::GlobalSum(std::complex<double>&) | |
0.00 2885.46 0.00 72 0.00 0.00 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::deallocate(Grid::Grid_simd<unsigned int, __Uint32x4_t>*, unsigned long) | |
0.00 2885.46 0.00 72 0.00 0.00 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::allocate(unsigned long, void const*) | |
0.00 2885.46 0.00 72 0.00 0.00 std::vector<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, std::allocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*> >::_M_default_append(unsigned long) | |
0.00 2885.46 0.00 64 0.00 0.00 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) | |
0.00 2885.46 0.00 64 0.00 0.00 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) | |
0.00 2885.46 0.00 55 0.00 0.00 Grid::GridCmdVectorIntToString[abi:cxx11](std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 52 0.00 0.00 Grid::CartesianCommunicator::InitFromMPICommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*) | |
0.00 2885.46 0.00 52 0.00 0.00 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) | |
0.00 2885.46 0.00 48 0.00 0.00 time_statistics::statistics(std::vector<double, std::allocator<double> >) | |
0.00 2885.46 0.00 48 0.00 0.00 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) | |
0.00 2885.46 0.00 48 0.00 0.00 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) | |
0.00 2885.46 0.00 48 0.00 0.00 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) | |
0.00 2885.46 0.00 48 0.00 0.00 Grid::GridBase::PermuteType(int) | |
0.00 2885.46 0.00 48 0.00 0.00 std::vector<int, std::allocator<int> >::vector(std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 42 0.00 0.00 Grid::GridDefaultMpi() | |
0.00 2885.46 0.00 42 0.00 0.00 Grid::Grid_sa_signal_handler(int, siginfo_t*, void*) | |
0.00 2885.46 0.00 39 0.00 0.00 Grid::GlobalSharedMemory::OptimalCommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*&) | |
0.00 2885.46 0.00 39 0.00 0.00 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 36 0.00 0.00 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::~CartesianStencil() | |
0.00 2885.46 0.00 36 0.00 0.00 Grid::alignedAllocator<Grid::StencilEntry>::deallocate(Grid::StencilEntry*, unsigned long) | |
0.00 2885.46 0.00 36 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) | |
0.00 2885.46 0.00 36 0.00 0.00 Grid::CartesianCommunicator::BroadcastWorld(int, void*, int) | |
0.00 2885.46 0.00 36 0.00 0.00 std::vector<Grid::StencilEntry, Grid::alignedAllocator<Grid::StencilEntry> >::_M_default_append(unsigned long) | |
0.00 2885.46 0.00 36 0.00 0.00 void std::vector<double, std::allocator<double> >::_M_realloc_insert<double const&>(__gnu_cxx::__normal_iterator<double*, std::vector<double, std::allocator<double> > >, double const&) | |
0.00 2885.46 0.00 33 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::deallocate(Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8>*, unsigned long) | |
0.00 2885.46 0.00 32 0.00 0.00 Grid::CartesianCommunicator::Broadcast(int, void*, int) | |
0.00 2885.46 0.00 32 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() | |
0.00 2885.46 0.00 32 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopOE(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
0.00 2885.46 0.00 32 0.00 0.01 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() | |
0.00 2885.46 0.00 31 0.00 0.00 Grid::GridDefaultSimd(int, int) | |
0.00 2885.46 0.00 25 0.00 0.00 std::seed_seq::seed_seq<__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > > >(__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >) | |
0.00 2885.46 0.00 24 0.00 0.01 Grid::LebesgueOrder::CartesianBlocking() | |
0.00 2885.46 0.00 24 0.00 0.01 Grid::LebesgueOrder::LebesgueOrder(Grid::GridBase*) | |
0.00 2885.46 0.00 24 0.00 0.04 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) | |
0.00 2885.46 0.00 24 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8>*, unsigned long) | |
0.00 2885.46 0.00 24 0.00 0.00 Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 24 0.00 0.00 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::Lattice(Grid::GridBase*) | |
0.00 2885.46 0.00 23 0.00 0.00 Grid::SharedMemory::~SharedMemory() | |
0.00 2885.46 0.00 23 0.00 0.00 Grid::CartesianCommunicator::~CartesianCommunicator() | |
0.00 2885.46 0.00 22 0.00 0.00 char** std::__find_if<char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const> >(char**, char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const>, std::random_access_iterator_tag) | |
0.00 2885.46 0.00 20 0.00 0.00 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::Lattice(Grid::GridBase*) | |
0.00 2885.46 0.00 16 0.00 0.00 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) | |
0.00 2885.46 0.00 16 0.00 0.00 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooeeInternalCompute(int, int, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&) | |
0.00 2885.46 0.00 16 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() | |
0.00 2885.46 0.00 16 0.00 0.01 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() | |
0.00 2885.46 0.00 12 0.00 0.00 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>*, unsigned long) | |
0.00 2885.46 0.00 12 0.00 0.00 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int, int) | |
0.00 2885.46 0.00 12 0.00 0.00 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::Lattice(Grid::GridBase*) | |
0.00 2885.46 0.00 12 0.00 0.00 std::vector<std::complex<float>, std::allocator<std::complex<float> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::complex<float>*, std::vector<std::complex<float>, std::allocator<std::complex<float> > > >, unsigned long, std::complex<float> const&) | |
0.00 2885.46 0.00 8 0.00 0.14 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsTanh(Grid::Approx::zolotarev_data*, double, double) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) | |
0.00 2885.46 0.00 8 0.00 1.14 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::CayleyFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, double, Grid::QCD::WilsonImplParams const&) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() | |
0.00 2885.46 0.00 8 0.00 0.14 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
0.00 2885.46 0.00 8 0.00 1.14 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::Approx::zolotarev_free(Grid::Approx::zolotarev_data*) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::Approx::higham(double, int) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::Approx::construct_contfrac(Grid::Approx::izd*) | |
0.00 2885.46 0.00 8 0.00 0.00 Grid::Approx::construct_partfrac(Grid::Approx::izd*) | |
0.00 2885.46 0.00 4 0.00 0.00 _GLOBAL__sub_I__ZN4Grid3QCD13SpaceTimeGrid15makeFourDimGridERKSt6vectorIiSaIiEES6_S6_ | |
0.00 2885.46 0.00 4 0.00 0.00 Grid::QCD::SpaceTimeGrid::makeFourDimDWFGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) | |
0.00 2885.46 0.00 4 0.00 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) | |
0.00 2885.46 0.00 4 0.00 0.29 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
0.00 2885.46 0.00 4 0.00 1.28 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) | |
0.00 2885.46 0.00 4 0.00 0.00 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() | |
0.00 2885.46 0.00 4 0.00 0.00 Grid::Approx::contfrac_A(double*, double*, double*, double*, int, int) | |
0.00 2885.46 0.00 3 0.00 0.00 void std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >::_M_realloc_insert<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&>(__gnu_cxx::__normal_iterator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >*, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) | |
0.00 2885.46 0.00 3 0.00 0.00 std::_Rb_tree<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::_Select1st<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >, std::less<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::allocator<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >::_M_erase(std::_Rb_tree_node<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >*) | |
0.00 2885.46 0.00 2 0.00 0.00 _GLOBAL__sub_I__ZN4Grid3QCD22StaggeredKernelsStatic3OptE | |
0.00 2885.46 0.00 2 0.00 0.00 _GLOBAL__sub_I__ZN4Grid3QCD5Gamma3gmuE | |
0.00 2885.46 0.00 2 0.00 0.00 Grid::Grid_quiesce_nodes() | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I_L_list | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid10GridThread8_threadsE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid13LebesgueOrder16UseLebesgueOrderE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid14MemoryProfiler5statsE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid18GlobalSharedMemory17MAX_MPI_SHM_BYTESE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid18GlobalSharedMemory4InitEP19ompi_communicator_t | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid21CartesianCommunicator18CommunicatorPolicyE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid21CartesianCommunicator18communicator_worldE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid26Gather_plane_table_computeEPNS_8GridBaseEiiiiRSt6vectorISt4pairIiiESaIS4_EE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid3QCD13WilsonKernelsINS0_17GparityWilsonImplINS_9Grid_simdISt7complexIfE13__Float32x4_tEENS0_14FundamentalRepILi3EEENS0_9CoeffRealEEEE12HandDhopSiteERNS0_13WilsonStencilINS_7iVectorINSE_INSE_IS7_Li3EEELi4EEELi2EEENSE_INSE_ISF_Li2EEELi2EEEEERNS_13LebesgueOrderERNS_7LatticeINSE_INSE_INS_7iScalarINS_7iMatrixIS7_Li3EEEEELi8EEELi2EEEEEPSJ_iiRKNSO_ISH_EERSY_ | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid3QCD19WilsonKernelsStatic3OptE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid3QCD21WilsonFermion5DStatic10directionsE | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid8demangleB5cxx11EPKc | |
0.00 2885.46 0.00 1 0.00 0.00 _GLOBAL__sub_I__ZN4Grid9printHashEv | |
0.00 2885.46 0.00 1 0.00 0.00 __static_initialization_and_destruction_0(int, int) [clone .constprop.58] | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::GridParseLayout(char**, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::GridCmdOptionCSL(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::GridLogConfigure(std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::GridLogTimestamp(int) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::GlobalSharedMemory::SharedMemoryAllocate(unsigned long, int) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::GlobalSharedMemory::Init(ompi_communicator_t*) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::CartesianCommunicator::Init(int*, char***) | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::CartesianCommunicator::RankWorld() | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::printHash() | |
0.00 2885.46 0.00 1 0.00 0.00 Grid::operator<<(std::ostream&, Grid::Logger&) [clone .constprop.140] | |
0.00 2885.46 0.00 1 0.00 0.00 std::_Rb_tree<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::_Select1st<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >, std::less<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::allocator<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >::_M_get_insert_unique_pos(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) | |
0.00 2885.46 0.00 1 0.00 0.00 void std::__introsort_loop<__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> > >(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> >) | |
% the percentage of the total running time of the | |
time program used by this function. | |
cumulative a running sum of the number of seconds accounted | |
seconds for by this function and those listed above it. | |
self the number of seconds accounted for by this | |
seconds function alone. This is the major sort for this | |
listing. | |
calls the number of times this function was invoked, if | |
this function is profiled, else blank. | |
self the average number of seconds spent in this | |
s/call function per call, if this function is profiled, | |
else blank. | |
total the average number of seconds spent in this | |
s/call function and its descendants per call, if this | |
function is profiled, else blank. | |
name the name of the function. This is the minor sort | |
for this listing. The index shows the location of | |
the function in the gprof listing. If the index is | |
in parentheses, it shows where it would appear in | |
the gprof listing if it were to be printed. | |
Copyright (C) 2012-2015 Free Software Foundation, Inc. | |
Copying and distribution of this file, with or without modification, | |
are permitted in any medium without royalty provided the copyright | |
notice and this notice are preserved. | |
Call graph (explanation follows) | |
granularity: each sample hit covers 2 byte(s) for 0.00% of 2885.46 seconds | |
index % time self children called name | |
1193 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
[1] 53.3 5.00 1532.19 0+1193 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
240.70 261.21 21952384/21952384 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [4] | |
193.88 227.74 19253970/19253970 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [6] | |
328.37 0.00 32487566/32487566 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [7] | |
280.29 0.00 29677671/29677671 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [10] | |
1193 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
----------------------------------------------- | |
<spontaneous> | |
[2] 44.3 3.60 1275.86 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) [2] | |
198.95 233.70 20202520/20202520 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [5] | |
298.00 3.22 28067609/28067609 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [8] | |
288.85 0.00 33607682/33607682 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [9] | |
253.14 0.00 30706382/30706382 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [11] | |
----------------------------------------------- | |
227.74 0.00 149316963/473465689 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [6] | |
233.70 0.00 153229376/473465689 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [5] | |
260.68 0.00 170919350/473465689 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [4] | |
[3] 25.0 722.12 0.00 473465689 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [3] | |
----------------------------------------------- | |
240.70 261.21 21952384/21952384 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
[4] 17.4 240.70 261.21 21952384 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [4] | |
260.68 0.00 170919350/473465689 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [3] | |
0.53 0.00 12524980/88378312 Grid::permute(Grid::Grid_simd<std::complex<float>, __Float32x4_t>&, Grid::Grid_simd<std::complex<float>, __Float32x4_t>, int) [21] | |
----------------------------------------------- | |
198.95 233.70 20202520/20202520 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) [2] | |
[5] 15.0 198.95 233.70 20202520 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [5] | |
233.70 0.00 153229376/473465689 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [3] | |
----------------------------------------------- | |
193.88 227.74 19253970/19253970 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
[6] 14.6 193.88 227.74 19253970 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [6] | |
227.74 0.00 149316963/473465689 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [3] | |
----------------------------------------------- | |
328.37 0.00 32487566/32487566 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
[7] 11.4 328.37 0.00 32487566 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [7] | |
----------------------------------------------- | |
298.00 3.22 28067609/28067609 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) [2] | |
[8] 10.4 298.00 3.22 28067609 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [8] | |
3.22 0.00 75853332/88378312 Grid::permute(Grid::Grid_simd<std::complex<float>, __Float32x4_t>&, Grid::Grid_simd<std::complex<float>, __Float32x4_t>, int) [21] | |
----------------------------------------------- | |
288.85 0.00 33607682/33607682 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) [2] | |
[9] 10.0 288.85 0.00 33607682 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [9] | |
----------------------------------------------- | |
280.29 0.00 29677671/29677671 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [1] | |
[10] 9.7 280.29 0.00 29677671 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [10] | |
----------------------------------------------- | |
253.14 0.00 30706382/30706382 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) [2] | |
[11] 8.8 253.14 0.00 30706382 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [11] | |
----------------------------------------------- | |
<spontaneous> | |
[12] 1.3 36.58 0.00 Grid::QCD::DomainWallFermion<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MomentumSpacePropagator(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, double) [12] | |
----------------------------------------------- | |
<spontaneous> | |
[13] 0.5 0.70 13.24 Benchmark::DWF(int, int, double&) [13] | |
0.00 9.13 8/8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::CayleyFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, double, Grid::QCD::WilsonImplParams const&) [15] | |
1.20 0.05 496/778 frame_dummy [23] | |
0.86 0.00 16/25 Grid::GridRNGbase::~GridRNGbase() [27] | |
0.00 0.70 16/24 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
0.28 0.16 8/8 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
0.00 0.38 32/32 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
0.00 0.16 72/116 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) [45] | |
0.00 0.15 64/64 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) [54] | |
0.02 0.02 8/16 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [67] | |
0.04 0.00 16/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.03 0.00 112/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.03 32/48 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
0.00 0.02 38464/38464 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [83] | |
0.00 0.00 16/24 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [104] | |
0.00 0.00 16/24 Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [112] | |
0.00 0.00 8/16 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [113] | |
0.00 0.00 38432/38432 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [141] | |
0.00 0.00 136/180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [158] | |
0.00 0.00 112/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
0.00 0.00 96/144 Grid::CartesianCommunicator::Barrier() [159] | |
0.00 0.00 72/76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
0.00 0.00 72/104 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::~Lattice() [163] | |
0.00 0.00 32/55 Grid::GridCmdVectorIntToString[abi:cxx11](std::vector<int, std::allocator<int> > const&) [173] | |
0.00 0.00 32/32 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() [187] | |
0.00 0.00 32/32 Grid::CartesianCommunicator::Broadcast(int, void*, int) [186] | |
0.00 0.00 32/48 time_statistics::statistics(std::vector<double, std::allocator<double> >) [174] | |
0.00 0.00 32/32 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopOE(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [188] | |
0.00 0.00 24/42 Grid::GridDefaultMpi() [177] | |
0.00 0.00 24/36 void std::vector<double, std::allocator<double> >::_M_realloc_insert<double const&>(__gnu_cxx::__normal_iterator<double*, std::vector<double, std::allocator<double> > >, double const&) [184] | |
0.00 0.00 16/31 Grid::GridDefaultSimd(int, int) [189] | |
0.00 0.00 16/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
0.00 0.00 8/12 std::vector<std::complex<float>, std::allocator<std::complex<float> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::complex<float>*, std::vector<std::complex<float>, std::allocator<std::complex<float> > > >, unsigned long, std::complex<float> const&) [198] | |
0.00 0.00 8/8 Grid::Approx::higham(double, int) [204] | |
0.00 0.00 8/8 Grid::Approx::zolotarev_free(Grid::Approx::zolotarev_data*) [203] | |
0.00 0.00 8/8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsTanh(Grid::Approx::zolotarev_data*, double, double) [200] | |
0.00 0.00 8/8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() [202] | |
----------------------------------------------- | |
1.48 2.20 12/36 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
2.96 4.39 24/36 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
[14] 0.4 4.44 6.59 36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
4.01 2.46 27861504/27861504 Grid::GridRedBlackCartesian::CheckerBoardFromOindex(int) [18] | |
0.00 0.12 36/36 std::vector<Grid::StencilEntry, Grid::alignedAllocator<Grid::StencilEntry> >::_M_default_append(unsigned long) [60] | |
0.00 0.00 3024/3024 Grid::GridRedBlackCartesian::CheckerBoardShiftForCB(int, int, int, int) [145] | |
0.00 0.00 2640/2640 Grid::GridRedBlackCartesian::CheckerBoarded(int) [147] | |
0.00 0.00 1512/3206 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [144] | |
0.00 0.00 1320/2790 Grid::GridCartesian::CheckerBoarded(int) [146] | |
0.00 0.00 216/216 Grid::SharedMemory::ShmBufferMalloc(unsigned long) [156] | |
0.00 0.00 72/191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
0.00 0.00 72/72 std::vector<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, std::allocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*> >::_M_default_append(unsigned long) [172] | |
0.00 0.00 36/127 Grid::SharedMemory::ShmBufferFreeAll() [160] | |
----------------------------------------------- | |
0.00 9.13 8/8 Benchmark::DWF(int, int, double&) [13] | |
[15] 0.3 0.00 9.13 8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::CayleyFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, double, Grid::QCD::WilsonImplParams const&) [15] | |
0.00 9.13 8/8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
----------------------------------------------- | |
0.00 9.13 8/8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::CayleyFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, double, Grid::QCD::WilsonImplParams const&) [15] | |
[16] 0.3 0.00 9.13 8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
2.96 4.39 24/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
0.00 1.16 8/8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [28] | |
0.43 0.00 24/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::BuildSurfaceList(int, int) [36] | |
0.00 0.12 16/24 Grid::LebesgueOrder::LebesgueOrder(Grid::GridBase*) [53] | |
0.00 0.05 24/24 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::Lattice(Grid::GridBase*) [72] | |
0.00 0.02 8/116 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) [45] | |
0.00 0.00 8/8 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) [199] | |
----------------------------------------------- | |
<spontaneous> | |
[17] 0.3 0.00 7.29 Benchmark::DWF5(int, int) [17] | |
0.00 5.14 4/4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
0.55 0.02 228/778 frame_dummy [23] | |
0.31 0.15 4/4 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.43 0.00 8/25 Grid::GridRNGbase::~GridRNGbase() [27] | |
0.00 0.35 8/24 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
0.00 0.19 16/16 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.00 0.07 32/116 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) [45] | |
0.02 0.02 8/16 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [67] | |
0.00 0.01 16/48 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
0.01 0.00 4/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.00 0.01 17600/17600 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [101] | |
0.00 0.00 8/24 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [104] | |
0.00 0.00 4/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.00 8/24 Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [112] | |
0.00 0.00 4/4 Grid::QCD::SpaceTimeGrid::makeFourDimDWFGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [118] | |
0.00 0.00 4/8 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [114] | |
0.00 0.00 17600/17600 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [143] | |
0.00 0.00 48/144 Grid::CartesianCommunicator::Barrier() [159] | |
0.00 0.00 32/180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [158] | |
0.00 0.00 32/104 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::~Lattice() [163] | |
0.00 0.00 16/42 Grid::GridDefaultMpi() [177] | |
0.00 0.00 16/55 Grid::GridCmdVectorIntToString[abi:cxx11](std::vector<int, std::allocator<int> > const&) [173] | |
0.00 0.00 16/16 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() [196] | |
0.00 0.00 16/48 time_statistics::statistics(std::vector<double, std::allocator<double> >) [174] | |
0.00 0.00 12/36 void std::vector<double, std::allocator<double> >::_M_realloc_insert<double const&>(__gnu_cxx::__normal_iterator<double*, std::vector<double, std::allocator<double> > >, double const&) [184] | |
0.00 0.00 8/31 Grid::GridDefaultSimd(int, int) [189] | |
0.00 0.00 4/76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
0.00 0.00 4/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
0.00 0.00 4/12 std::vector<std::complex<float>, std::allocator<std::complex<float> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::complex<float>*, std::vector<std::complex<float>, std::allocator<std::complex<float> > > >, unsigned long, std::complex<float> const&) [198] | |
0.00 0.00 4/4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() [209] | |
0.00 0.00 4/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
----------------------------------------------- | |
4.01 2.46 27861504/27861504 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[18] 0.2 4.01 2.46 27861504 Grid::GridRedBlackCartesian::CheckerBoardFromOindex(int) [18] | |
2.23 0.23 27861504/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
----------------------------------------------- | |
0.00 5.14 4/4 Benchmark::DWF5(int, int) [17] | |
[19] 0.2 0.00 5.14 4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
1.48 2.20 12/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
0.00 1.15 4/4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [29] | |
0.22 0.00 12/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::BuildSurfaceList(int, int) [36] | |
0.00 0.06 8/24 Grid::LebesgueOrder::LebesgueOrder(Grid::GridBase*) [53] | |
0.00 0.02 12/12 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::Lattice(Grid::GridBase*) [88] | |
0.00 0.01 4/116 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) [45] | |
0.00 0.00 4/4 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) [208] | |
----------------------------------------------- | |
<spontaneous> | |
[20] 0.1 3.84 0.00 Grid::QCD::FermionOperator<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::RedBlackGrid() [20] | |
----------------------------------------------- | |
0.53 0.00 12524980/88378312 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [4] | |
3.22 0.00 75853332/88378312 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [8] | |
[21] 0.1 3.75 0.00 88378312 Grid::permute(Grid::Grid_simd<std::complex<float>, __Float32x4_t>&, Grid::Grid_simd<std::complex<float>, __Float32x4_t>, int) [21] | |
----------------------------------------------- | |
923818 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 2/32499663 Grid::GlobalSharedMemory::Init(ompi_communicator_t*) [120] | |
0.00 0.00 32/32499663 void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) [32] | |
0.00 0.00 39/32499663 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
0.00 0.00 48/32499663 Grid::QCD::SpaceTimeGrid::makeFourDimDWFGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [118] | |
0.00 0.00 52/32499663 Grid::CartesianCommunicator::InitFromMPICommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*) [119] | |
0.00 0.00 91/32499663 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [116] | |
0.00 0.00 96/32499663 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [114] | |
0.00 0.00 132/32499663 Benchmark::Memory() [49] | |
0.00 0.00 192/32499663 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [113] | |
0.00 0.00 288/32499663 Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [112] | |
0.00 0.00 25800/32499663 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.01 0.00 178511/32499663 frame_dummy [23] | |
0.03 0.00 422144/32499663 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.04 0.00 527888/32499663 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [67] | |
0.14 0.01 1688628/32499663 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.14 0.01 1794216/32499663 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
2.23 0.23 27861504/32499663 Grid::GridRedBlackCartesian::CheckerBoardFromOindex(int) [18] | |
[22] 0.1 2.61 0.27 32499663+923818 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.09 0.00 296737/296762 sitmo::prng_engine::encrypt_counter() [64] | |
0.07 0.00 269928/410303 Grid::GridRedBlackCartesian::oIndex(std::vector<int, std::allocator<int> >&) [62] | |
0.06 0.00 403941/625601 Grid::GridRedBlackCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [63] | |
0.02 0.00 269418/1535850 Grid::GridBase::oIndex(std::vector<int, std::allocator<int> >&) [56] | |
0.02 0.00 231465/1497897 Grid::GridBase::iIndex(std::vector<int, std::allocator<int> >&) [55] | |
0.01 0.00 190280/190280 Grid::CartesianCommunicator::RankFromProcessorCoor(std::vector<int, std::allocator<int> >&) [93] | |
0.00 0.00 208792/3585944 Grid::CartesianCommunicator::ThisRank() [92] | |
923818 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
----------------------------------------------- | |
5536 frame_dummy [23] | |
0.03 0.00 13/778 Benchmark::Decomposition() [81] | |
0.04 0.00 17/778 Benchmark::Memory() [49] | |
0.06 0.00 24/778 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
0.55 0.02 228/778 Benchmark::DWF5(int, int) [17] | |
1.20 0.05 496/778 Benchmark::DWF(int, int, double&) [13] | |
[23] 0.1 1.89 0.07 778+5536 frame_dummy [23] | |
0.03 0.00 124573/410303 Grid::GridRedBlackCartesian::oIndex(std::vector<int, std::allocator<int> >&) [62] | |
0.03 0.00 197535/625601 Grid::GridRedBlackCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [63] | |
0.01 0.00 178511/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
5536 frame_dummy [23] | |
----------------------------------------------- | |
<spontaneous> | |
[24] 0.1 1.84 0.00 __multf3 [24] | |
----------------------------------------------- | |
<spontaneous> | |
[25] 0.1 1.74 0.00 Grid::QCD::FermionOperator<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooDeriv(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int) [25] | |
----------------------------------------------- | |
283544 std::enable_if<Grid::matchGridTensorIndex<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4>, 2>::value, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >::type Grid::QCD::operator*<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >(Grid::QCD::Gamma const&, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> const&) [26] | |
[26] 0.1 1.49 0.00 0+283544 std::enable_if<Grid::matchGridTensorIndex<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4>, 2>::value, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >::type Grid::QCD::operator*<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >(Grid::QCD::Gamma const&, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> const&) [26] | |
283544 std::enable_if<Grid::matchGridTensorIndex<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4>, 2>::value, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >::type Grid::QCD::operator*<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >(Grid::QCD::Gamma const&, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> const&) [26] | |
----------------------------------------------- | |
0.05 0.00 1/25 Benchmark::Memory() [49] | |
0.43 0.00 8/25 Benchmark::DWF5(int, int) [17] | |
0.86 0.00 16/25 Benchmark::DWF(int, int, double&) [13] | |
[27] 0.0 1.34 0.00 25 Grid::GridRNGbase::~GridRNGbase() [27] | |
----------------------------------------------- | |
0.00 1.16 8/8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
[28] 0.0 0.00 1.16 8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [28] | |
0.00 1.14 8/8 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
0.02 0.00 8/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.00 0.00 8/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
----------------------------------------------- | |
0.00 1.15 4/4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
[29] 0.0 0.00 1.15 4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [29] | |
0.07 1.07 4/4 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.01 0.00 4/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.00 0.00 4/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
----------------------------------------------- | |
0.07 1.07 4/4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [29] | |
[30] 0.0 0.07 1.07 4 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.65 0.15 844288/844288 void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) [35] | |
0.13 0.08 422144/422144 void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) [46] | |
0.03 0.00 422144/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.01 0.00 4/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.01 0.00 32/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.01 16/48 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
0.00 0.00 4/20 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::Lattice(Grid::GridBase*) [102] | |
0.00 0.00 52/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
0.00 0.00 4/36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
----------------------------------------------- | |
0.00 1.14 8/8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [28] | |
[31] 0.0 0.00 1.14 8 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
0.98 0.12 32/32 void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) [32] | |
0.02 0.00 64/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.01 32/48 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
0.00 0.00 16/20 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::Lattice(Grid::GridBase*) [102] | |
0.00 0.00 112/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
0.00 0.00 72/72 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::deallocate(Grid::Grid_simd<unsigned int, __Uint32x4_t>*, unsigned long) [170] | |
0.00 0.00 72/72 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::allocate(unsigned long, void const*) [171] | |
----------------------------------------------- | |
0.98 0.12 32/32 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
[32] 0.0 0.98 0.12 32 void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) [32] | |
0.11 0.00 3377152/3377152 Grid::CartesianCommunicator::ProcessorCoorFromRank(int, std::vector<int, std::allocator<int> >&) [61] | |
0.01 0.00 3377152/3585944 Grid::CartesianCommunicator::ThisRank() [92] | |
0.00 0.00 32/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
----------------------------------------------- | |
0.00 0.35 8/24 Benchmark::DWF5(int, int) [17] | |
0.00 0.70 16/24 Benchmark::DWF(int, int, double&) [13] | |
[33] 0.0 0.00 1.05 24 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
0.78 0.00 24/25 std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::discrete_distribution<int>*, std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > > >, unsigned long, std::discrete_distribution<int> const&) [34] | |
0.12 0.00 24/25 std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::normal_distribution<double>*, std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > > >, unsigned long, std::normal_distribution<double> const&) [58] | |
0.06 0.00 24/778 frame_dummy [23] | |
0.05 0.00 24/25 std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_int_distribution<unsigned int>*, std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > > >, unsigned long, std::uniform_int_distribution<unsigned int> const&) [70] | |
0.04 0.00 24/25 std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_real_distribution<double>*, std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > > >, unsigned long, std::uniform_real_distribution<double> const&) [79] | |
----------------------------------------------- | |
0.03 0.00 1/25 Benchmark::Memory() [49] | |
0.78 0.00 24/25 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
[34] 0.0 0.81 0.00 25 std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::discrete_distribution<int>*, std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > > >, unsigned long, std::discrete_distribution<int> const&) [34] | |
----------------------------------------------- | |
0.65 0.15 844288/844288 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
[35] 0.0 0.65 0.15 844288 void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) [35] | |
0.08 0.00 844288/1497897 Grid::GridBase::iIndex(std::vector<int, std::allocator<int> >&) [55] | |
0.07 0.00 844288/1535850 Grid::GridBase::oIndex(std::vector<int, std::allocator<int> >&) [56] | |
0.00 0.00 844288/1266432 Grid::GridCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [130] | |
----------------------------------------------- | |
0.22 0.00 12/36 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
0.43 0.00 24/36 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
[36] 0.0 0.65 0.00 36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::BuildSurfaceList(int, int) [36] | |
----------------------------------------------- | |
<spontaneous> | |
[37] 0.0 0.65 0.00 __trunctfdf2 [37] | |
----------------------------------------------- | |
18720 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.04 0.00 120/1560 Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Reporti(int) [77] | |
0.11 0.01 304/1560 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.18 0.01 528/1560 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() [47] | |
0.21 0.01 608/1560 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
[38] 0.0 0.54 0.03 1560+18720 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.02 0.00 167755/167755 Grid::Grid_simd<unsigned int, __Uint32x4_t> Grid::Comparison<Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t>, 0>(Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::Grid_simd<unsigned int, __Uint32x4_t>::scalar_type const&) [85] | |
0.00 0.00 15802/410303 Grid::GridRedBlackCartesian::oIndex(std::vector<int, std::allocator<int> >&) [62] | |
0.00 0.00 24125/625601 Grid::GridRedBlackCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [63] | |
0.00 0.00 25800/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
18720 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
----------------------------------------------- | |
<spontaneous> | |
[39] 0.0 0.48 0.00 __extenddftf2 [39] | |
----------------------------------------------- | |
0.31 0.15 4/4 Benchmark::DWF5(int, int) [17] | |
[40] 0.0 0.31 0.15 4 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.14 0.01 1688628/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 4/8 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [114] | |
0.00 0.00 4/52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
0.00 0.00 12/620 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) [151] | |
0.00 0.00 4/191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
0.00 0.00 4/23 Grid::CartesianCommunicator::~CartesianCommunicator() [193] | |
----------------------------------------------- | |
0.28 0.16 8/8 Benchmark::DWF(int, int, double&) [13] | |
[41] 0.0 0.28 0.16 8 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
0.14 0.01 1794216/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 8/16 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [113] | |
0.00 0.00 8/52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
0.00 0.00 24/620 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) [151] | |
0.00 0.00 8/191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
0.00 0.00 8/23 Grid::CartesianCommunicator::~CartesianCommunicator() [193] | |
----------------------------------------------- | |
0.14 0.00 64/180 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) [54] | |
0.25 0.00 116/180 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) [45] | |
[42] 0.0 0.39 0.00 180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::allocate(unsigned long, void const*) [42] | |
0.00 0.00 180/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.38 32/32 Benchmark::DWF(int, int, double&) [13] | |
[43] 0.0 0.00 0.38 32 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
0.21 0.01 608/1560 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.00 0.13 96/144 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() [47] | |
0.00 0.03 96/144 Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Reporti(int) [77] | |
0.00 0.00 32/48 std::vector<int, std::allocator<int> >::vector(std::vector<int, std::allocator<int> > const&) [176] | |
0.00 0.00 32/672 Grid::CartesianCommunicator::GlobalSum(double&) [150] | |
----------------------------------------------- | |
<spontaneous> | |
[44] 0.0 0.27 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::TwoIndexRep<3, (Grid::QCD::TwoIndexSymmetry)1>, Grid::QCD::CoeffReal> >::ContractConservedCurrentSiteBwd(Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> > const&, Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> > const&, Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6> >, 8> >&, unsigned int, unsigned int, bool) [44] | |
----------------------------------------------- | |
0.00 0.01 4/116 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
0.00 0.02 8/116 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
0.00 0.07 32/116 Benchmark::DWF5(int, int) [17] | |
0.00 0.16 72/116 Benchmark::DWF(int, int, double&) [13] | |
[45] 0.0 0.00 0.25 116 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) [45] | |
0.25 0.00 116/180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::allocate(unsigned long, void const*) [42] | |
----------------------------------------------- | |
0.13 0.08 422144/422144 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
[46] 0.0 0.13 0.08 422144 void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) [46] | |
0.04 0.00 422144/1497897 Grid::GridBase::iIndex(std::vector<int, std::allocator<int> >&) [55] | |
0.04 0.00 422144/1535850 Grid::GridBase::oIndex(std::vector<int, std::allocator<int> >&) [56] | |
0.00 0.00 422144/1266432 Grid::GridCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [130] | |
----------------------------------------------- | |
0.00 0.06 48/144 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.00 0.13 96/144 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
[47] 0.0 0.00 0.19 144 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() [47] | |
0.18 0.01 528/1560 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.00 0.00 624/672 Grid::CartesianCommunicator::GlobalSum(double&) [150] | |
----------------------------------------------- | |
0.00 0.19 16/16 Benchmark::DWF5(int, int) [17] | |
[48] 0.0 0.00 0.19 16 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.11 0.01 304/1560 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.00 0.06 48/144 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() [47] | |
0.00 0.01 48/144 Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Reporti(int) [77] | |
0.00 0.00 16/48 std::vector<int, std::allocator<int> >::vector(std::vector<int, std::allocator<int> > const&) [176] | |
0.00 0.00 16/672 Grid::CartesianCommunicator::GlobalSum(double&) [150] | |
----------------------------------------------- | |
<spontaneous> | |
[49] 0.0 0.01 0.18 Benchmark::Memory() [49] | |
0.05 0.00 1/25 Grid::GridRNGbase::~GridRNGbase() [27] | |
0.04 0.00 17/778 frame_dummy [23] | |
0.04 0.00 33/33 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::allocate(unsigned long, void const*) [78] | |
0.03 0.00 1/25 std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::discrete_distribution<int>*, std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > > >, unsigned long, std::discrete_distribution<int> const&) [34] | |
0.01 0.00 1/25 std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::normal_distribution<double>*, std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > > >, unsigned long, std::normal_distribution<double> const&) [58] | |
0.00 0.00 1/25 std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_int_distribution<unsigned int>*, std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > > >, unsigned long, std::uniform_int_distribution<unsigned int> const&) [70] | |
0.00 0.00 1/25 std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_real_distribution<double>*, std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > > >, unsigned long, std::uniform_real_distribution<double> const&) [79] | |
0.00 0.00 132/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 11/39 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
0.00 0.00 1/296762 sitmo::prng_engine::encrypt_counter() [64] | |
0.00 0.00 33/33 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::deallocate(Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8>*, unsigned long) [185] | |
0.00 0.00 12/36 Grid::CartesianCommunicator::BroadcastWorld(int, void*, int) [183] | |
0.00 0.00 11/23 Grid::CartesianCommunicator::~CartesianCommunicator() [193] | |
0.00 0.00 1/42 Grid::GridDefaultMpi() [177] | |
0.00 0.00 1/31 Grid::GridDefaultSimd(int, int) [189] | |
0.00 0.00 1/25 std::seed_seq::seed_seq<__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > > >(__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >) [190] | |
----------------------------------------------- | |
1108128 Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [50] | |
0.18 0.00 79152/79152 Grid::LebesgueOrder::IterateO(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [51] | |
[50] 0.0 0.18 0.00 79152+1108128 Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [50] | |
0.00 0.00 368/620 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) [151] | |
1108128 Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [50] | |
----------------------------------------------- | |
0.00 0.18 1040/1040 Grid::LebesgueOrder::CartesianBlocking() [52] | |
[51] 0.0 0.00 0.18 1040 Grid::LebesgueOrder::IterateO(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [51] | |
0.18 0.00 79152/79152 Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [50] | |
----------------------------------------------- | |
0.00 0.18 24/24 Grid::LebesgueOrder::LebesgueOrder(Grid::GridBase*) [53] | |
[52] 0.0 0.00 0.18 24 Grid::LebesgueOrder::CartesianBlocking() [52] | |
0.00 0.18 1040/1040 Grid::LebesgueOrder::IterateO(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [51] | |
----------------------------------------------- | |
0.00 0.06 8/24 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
0.00 0.12 16/24 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
[53] 0.0 0.00 0.18 24 Grid::LebesgueOrder::LebesgueOrder(Grid::GridBase*) [53] | |
0.00 0.18 24/24 Grid::LebesgueOrder::CartesianBlocking() [52] | |
----------------------------------------------- | |
0.00 0.15 64/64 Benchmark::DWF(int, int, double&) [13] | |
[54] 0.0 0.00 0.15 64 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) [54] | |
0.14 0.00 64/180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::allocate(unsigned long, void const*) [42] | |
0.00 0.01 64/64 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [90] | |
0.00 0.00 128/3206 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [144] | |
0.00 0.00 64/224 Grid::GridCartesian::CheckerBoardDestination(int, int, int) [155] | |
----------------------------------------------- | |
0.02 0.00 231465/1497897 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.04 0.00 422144/1497897 void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) [46] | |
0.08 0.00 844288/1497897 void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) [35] | |
[55] 0.0 0.14 0.00 1497897 Grid::GridBase::iIndex(std::vector<int, std::allocator<int> >&) [55] | |
----------------------------------------------- | |
0.02 0.00 269418/1535850 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.04 0.00 422144/1535850 void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) [46] | |
0.07 0.00 844288/1535850 void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) [35] | |
[56] 0.0 0.14 0.00 1535850 Grid::GridBase::oIndex(std::vector<int, std::allocator<int> >&) [56] | |
----------------------------------------------- | |
0.00 0.00 4/424 Benchmark::DWF5(int, int) [17] | |
0.01 0.00 20/424 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::Lattice(Grid::GridBase*) [102] | |
0.01 0.00 32/424 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.01 0.00 48/424 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
0.02 0.00 64/424 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
0.03 0.00 112/424 Benchmark::DWF(int, int, double&) [13] | |
0.04 0.00 144/424 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
[57] 0.0 0.13 0.00 424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.00 424/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.01 0.00 1/25 Benchmark::Memory() [49] | |
0.12 0.00 24/25 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
[58] 0.0 0.13 0.00 25 std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::normal_distribution<double>*, std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > > >, unsigned long, std::normal_distribution<double> const&) [58] | |
----------------------------------------------- | |
0.12 0.00 36/36 std::vector<Grid::StencilEntry, Grid::alignedAllocator<Grid::StencilEntry> >::_M_default_append(unsigned long) [60] | |
[59] 0.0 0.12 0.00 36 Grid::alignedAllocator<Grid::StencilEntry>::allocate(unsigned long, void const*) [59] | |
0.00 0.00 36/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.12 36/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[60] 0.0 0.00 0.12 36 std::vector<Grid::StencilEntry, Grid::alignedAllocator<Grid::StencilEntry> >::_M_default_append(unsigned long) [60] | |
0.12 0.00 36/36 Grid::alignedAllocator<Grid::StencilEntry>::allocate(unsigned long, void const*) [59] | |
----------------------------------------------- | |
0.11 0.00 3377152/3377152 void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) [32] | |
[61] 0.0 0.11 0.00 3377152 Grid::CartesianCommunicator::ProcessorCoorFromRank(int, std::vector<int, std::allocator<int> >&) [61] | |
----------------------------------------------- | |
0.00 0.00 15802/410303 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.03 0.00 124573/410303 frame_dummy [23] | |
0.07 0.00 269928/410303 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
[62] 0.0 0.10 0.00 410303 Grid::GridRedBlackCartesian::oIndex(std::vector<int, std::allocator<int> >&) [62] | |
----------------------------------------------- | |
0.00 0.00 24125/625601 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
0.03 0.00 197535/625601 frame_dummy [23] | |
0.06 0.00 403941/625601 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
[63] 0.0 0.09 0.00 625601 Grid::GridRedBlackCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [63] | |
----------------------------------------------- | |
0.00 0.00 1/296762 Benchmark::Memory() [49] | |
0.00 0.00 24/296762 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [104] | |
0.09 0.00 296737/296762 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
[64] 0.0 0.09 0.00 296762 sitmo::prng_engine::encrypt_counter() [64] | |
----------------------------------------------- | |
397821 Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const Grid::predicatedWhere<Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const>(Grid::Grid_simd<unsigned int, __Uint32x4_t> const& const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&) [65] | |
[65] 0.0 0.09 0.00 0+397821 Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const Grid::predicatedWhere<Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const>(Grid::Grid_simd<unsigned int, __Uint32x4_t> const& const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&) [65] | |
397821 Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const Grid::predicatedWhere<Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const>(Grid::Grid_simd<unsigned int, __Uint32x4_t> const& const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&) [65] | |
----------------------------------------------- | |
0.01 0.00 4/36 Benchmark::DWF5(int, int) [17] | |
0.01 0.00 4/36 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.01 0.00 4/36 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [29] | |
0.02 0.00 8/36 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [28] | |
0.04 0.00 16/36 Benchmark::DWF(int, int, double&) [13] | |
[66] 0.0 0.09 0.00 36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.00 0.00 36/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.02 0.02 8/16 Benchmark::DWF(int, int, double&) [13] | |
0.02 0.02 8/16 Benchmark::DWF5(int, int) [17] | |
[67] 0.0 0.04 0.05 16 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [67] | |
0.04 0.00 527888/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 16/52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
0.00 0.00 16/191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
----------------------------------------------- | |
<spontaneous> | |
[68] 0.0 0.06 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteDag(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [68] | |
----------------------------------------------- | |
<spontaneous> | |
[69] 0.0 0.06 0.00 __divdc3 [69] | |
----------------------------------------------- | |
0.00 0.00 1/25 Benchmark::Memory() [49] | |
0.05 0.00 24/25 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
[70] 0.0 0.05 0.00 25 std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_int_distribution<unsigned int>*, std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > > >, unsigned long, std::uniform_int_distribution<unsigned int> const&) [70] | |
----------------------------------------------- | |
0.05 0.00 24/24 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::Lattice(Grid::GridBase*) [72] | |
[71] 0.0 0.05 0.00 24 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::allocate(unsigned long, void const*) [71] | |
0.00 0.00 24/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.05 24/24 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
[72] 0.0 0.00 0.05 24 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::Lattice(Grid::GridBase*) [72] | |
0.05 0.00 24/24 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::allocate(unsigned long, void const*) [71] | |
----------------------------------------------- | |
<spontaneous> | |
[73] 0.0 0.05 0.00 Grid::Gather_plane_table_compute(Grid::GridBase*, int, int, int, int, std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >&) [73] | |
----------------------------------------------- | |
<spontaneous> | |
[74] 0.0 0.05 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplex> >::HandDhopSiteDagExt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&) [74] | |
----------------------------------------------- | |
<spontaneous> | |
[75] 0.0 0.05 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::TwoIndexRep<3, (Grid::QCD::TwoIndexSymmetry)-1>, Grid::QCD::CoeffReal> >::DhopDir(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int, int) [75] | |
----------------------------------------------- | |
0.00 0.01 16/48 Benchmark::DWF5(int, int) [17] | |
0.00 0.03 32/48 Benchmark::DWF(int, int, double&) [13] | |
[76] 0.0 0.00 0.04 48 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
0.04 0.00 144/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.00 432/432 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >*, unsigned long) [152] | |
0.00 0.00 432/432 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::allocate(unsigned long, void const*) [153] | |
0.00 0.00 144/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
----------------------------------------------- | |
0.00 0.01 48/144 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.00 0.03 96/144 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
[77] 0.0 0.00 0.04 144 Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Reporti(int) [77] | |
0.04 0.00 120/1560 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
----------------------------------------------- | |
0.04 0.00 33/33 Benchmark::Memory() [49] | |
[78] 0.0 0.04 0.00 33 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::allocate(unsigned long, void const*) [78] | |
0.00 0.00 33/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.00 1/25 Benchmark::Memory() [49] | |
0.04 0.00 24/25 Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [33] | |
[79] 0.0 0.04 0.00 25 std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_real_distribution<double>*, std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > > >, unsigned long, std::uniform_real_distribution<double> const&) [79] | |
----------------------------------------------- | |
<spontaneous> | |
[80] 0.0 0.04 0.00 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteDag(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [80] | |
----------------------------------------------- | |
<spontaneous> | |
[81] 0.0 0.00 0.03 Benchmark::Decomposition() [81] | |
0.03 0.00 13/778 frame_dummy [23] | |
0.00 0.00 7/55 Grid::GridCmdVectorIntToString[abi:cxx11](std::vector<int, std::allocator<int> > const&) [173] | |
0.00 0.00 6/31 Grid::GridDefaultSimd(int, int) [189] | |
0.00 0.00 1/42 Grid::GridDefaultMpi() [177] | |
----------------------------------------------- | |
<spontaneous> | |
[82] 0.0 0.03 0.00 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopDir(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int, int) [82] | |
----------------------------------------------- | |
0.00 0.02 38464/38464 Benchmark::DWF(int, int, double&) [13] | |
[83] 0.0 0.00 0.02 38464 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [83] | |
0.01 0.01 19232/19232 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [89] | |
0.00 0.01 19232/19232 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [100] | |
----------------------------------------------- | |
0.00 0.01 16/48 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.00 0.01 32/48 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
[84] 0.0 0.00 0.02 48 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
0.01 0.00 48/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.01 48/48 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
0.00 0.00 96/3206 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [144] | |
0.00 0.00 48/224 Grid::GridCartesian::CheckerBoardDestination(int, int, int) [155] | |
----------------------------------------------- | |
0.02 0.00 167755/167755 Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) [38] | |
[85] 0.0 0.02 0.00 167755 Grid::Grid_simd<unsigned int, __Uint32x4_t> Grid::Comparison<Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t>, 0>(Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::Grid_simd<unsigned int, __Uint32x4_t>::scalar_type const&) [85] | |
----------------------------------------------- | |
0.00 0.00 8800/112128 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [109] | |
0.00 0.00 19232/112128 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [89] | |
0.01 0.00 28032/112128 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
0.01 0.00 56064/112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [94] | |
[86] 0.0 0.02 0.00 112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) [86] | |
----------------------------------------------- | |
0.02 0.00 12/12 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::Lattice(Grid::GridBase*) [88] | |
[87] 0.0 0.02 0.00 12 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::allocate(unsigned long, void const*) [87] | |
0.00 0.00 12/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.02 12/12 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
[88] 0.0 0.00 0.02 12 Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::Lattice(Grid::GridBase*) [88] | |
0.02 0.00 12/12 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::allocate(unsigned long, void const*) [87] | |
----------------------------------------------- | |
0.01 0.01 19232/19232 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [83] | |
[89] 0.0 0.01 0.01 19232 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [89] | |
0.00 0.00 19232/56064 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [94] | |
0.00 0.00 19232/112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) [86] | |
0.00 0.00 19232/56064 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Prepare() [140] | |
0.00 0.00 19232/28032 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
----------------------------------------------- | |
0.00 0.01 64/64 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) [54] | |
[90] 0.0 0.00 0.01 64 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [90] | |
0.01 0.00 16/16 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int, int) [91] | |
0.00 0.00 824/824 void Grid::Copy_plane<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int) [110] | |
0.00 0.00 840/3206 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [144] | |
0.00 0.00 64/224 Grid::GridCartesian::CheckerBoardDestination(int, int, int) [155] | |
----------------------------------------------- | |
0.01 0.00 16/16 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [90] | |
[91] 0.0 0.01 0.00 16 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int, int) [91] | |
0.00 0.00 7/54 std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) [96] | |
0.00 0.00 16/2790 Grid::GridCartesian::CheckerBoarded(int) [146] | |
----------------------------------------------- | |
0.00 0.00 208792/3585944 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.01 0.00 3377152/3585944 void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) [32] | |
[92] 0.0 0.01 0.00 3585944 Grid::CartesianCommunicator::ThisRank() [92] | |
----------------------------------------------- | |
0.01 0.00 190280/190280 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
[93] 0.0 0.01 0.00 190280 Grid::CartesianCommunicator::RankFromProcessorCoor(std::vector<int, std::allocator<int> >&) [93] | |
----------------------------------------------- | |
0.00 0.00 8800/56064 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [109] | |
0.00 0.00 19232/56064 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [89] | |
0.00 0.01 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[94] 0.0 0.00 0.01 56064 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [94] | |
0.01 0.00 56064/112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) [86] | |
0.00 0.00 56064/112128 Grid::CartesianCommunicator::StencilBarrier() [131] | |
----------------------------------------------- | |
0.00 0.00 8800/28032 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [108] | |
0.00 0.01 19232/28032 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [100] | |
[95] 0.0 0.00 0.01 28032 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
0.01 0.00 28032/112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) [86] | |
0.00 0.01 28032/56064 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [94] | |
0.00 0.00 28032/56064 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Prepare() [140] | |
0.00 0.00 28032/112128 Grid::CartesianCommunicator::StencilBarrier() [131] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void>&, int, int&) [134] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void>&, int, int&) [136] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void>&, int, int&) [138] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void>&, int, int&) [132] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void>&, int, int&) [135] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void>&, int, int&) [137] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void>&, int, int&) [139] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void>&, int, int&) [133] | |
----------------------------------------------- | |
0.00 0.00 7/54 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int, int) [91] | |
0.00 0.00 10/54 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int, int) [111] | |
0.00 0.00 15/54 void Grid::Copy_plane<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int) [110] | |
0.00 0.00 22/54 void Grid::Copy_plane<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int) [107] | |
[96] 0.0 0.01 0.00 54 std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) [96] | |
----------------------------------------------- | |
<spontaneous> | |
[97] 0.0 0.01 0.00 Grid::CartesianCommunicator::ShiftedRanks(int, int, int&, int&) [97] | |
----------------------------------------------- | |
<spontaneous> | |
[98] 0.0 0.01 0.00 Grid::CartesianCommunicator::BossRank() [98] | |
----------------------------------------------- | |
<spontaneous> | |
[99] 0.0 0.01 0.00 std::vector<std::vector<ompi_request_t*, std::allocator<ompi_request_t*> >, std::allocator<std::vector<ompi_request_t*, std::allocator<ompi_request_t*> > > >::~vector() [99] | |
----------------------------------------------- | |
0.00 0.01 19232/19232 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [83] | |
[100] 0.0 0.00 0.01 19232 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [100] | |
0.00 0.01 19232/28032 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
----------------------------------------------- | |
0.00 0.01 17600/17600 Benchmark::DWF5(int, int) [17] | |
[101] 0.0 0.00 0.01 17600 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [101] | |
0.00 0.00 8800/8800 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [108] | |
0.00 0.00 8800/8800 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [109] | |
----------------------------------------------- | |
0.00 0.00 4/20 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.00 0.00 16/20 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
[102] 0.0 0.00 0.01 20 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::Lattice(Grid::GridBase*) [102] | |
0.01 0.00 20/424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
----------------------------------------------- | |
0.00 0.01 48/48 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
[103] 0.0 0.00 0.01 48 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
0.00 0.00 618/618 void Grid::Copy_plane<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int) [107] | |
0.00 0.00 12/12 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int, int) [111] | |
0.00 0.00 630/3206 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [144] | |
0.00 0.00 48/224 Grid::GridCartesian::CheckerBoardDestination(int, int, int) [155] | |
0.00 0.00 48/48 Grid::GridBase::PermuteType(int) [175] | |
----------------------------------------------- | |
0.00 0.00 8/24 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 16/24 Benchmark::DWF(int, int, double&) [13] | |
[104] 0.0 0.01 0.00 24 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [104] | |
0.00 0.00 24/296762 sitmo::prng_engine::encrypt_counter() [64] | |
0.00 0.00 24/25 std::seed_seq::seed_seq<__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > > >(__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >) [190] | |
0.00 0.00 24/36 Grid::CartesianCommunicator::BroadcastWorld(int, void*, int) [183] | |
----------------------------------------------- | |
<spontaneous> | |
[105] 0.0 0.01 0.00 Grid::GridRedBlackCartesian::~GridRedBlackCartesian() [105] | |
----------------------------------------------- | |
<spontaneous> | |
[106] 0.0 0.01 0.00 std::ctype<char>::do_widen(char) const [106] | |
----------------------------------------------- | |
0.00 0.00 618/618 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
[107] 0.0 0.00 0.00 618 void Grid::Copy_plane<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int) [107] | |
0.00 0.00 22/54 std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) [96] | |
0.00 0.00 618/2790 Grid::GridCartesian::CheckerBoarded(int) [146] | |
----------------------------------------------- | |
0.00 0.00 8800/8800 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [101] | |
[108] 0.0 0.00 0.00 8800 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [108] | |
0.00 0.00 8800/28032 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
----------------------------------------------- | |
0.00 0.00 8800/8800 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [101] | |
[109] 0.0 0.00 0.00 8800 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [109] | |
0.00 0.00 8800/56064 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [94] | |
0.00 0.00 8800/112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) [86] | |
0.00 0.00 8800/56064 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Prepare() [140] | |
0.00 0.00 8800/28032 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
----------------------------------------------- | |
0.00 0.00 824/824 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [90] | |
[110] 0.0 0.00 0.00 824 void Grid::Copy_plane<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int) [110] | |
0.00 0.00 15/54 std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) [96] | |
0.00 0.00 824/2790 Grid::GridCartesian::CheckerBoarded(int) [146] | |
----------------------------------------------- | |
0.00 0.00 12/12 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
[111] 0.0 0.00 0.00 12 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int, int) [111] | |
0.00 0.00 10/54 std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) [96] | |
0.00 0.00 12/2790 Grid::GridCartesian::CheckerBoarded(int) [146] | |
----------------------------------------------- | |
0.00 0.00 8/24 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 16/24 Benchmark::DWF(int, int, double&) [13] | |
[112] 0.0 0.00 0.00 24 Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [112] | |
0.00 0.00 288/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 24/39 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
----------------------------------------------- | |
0.00 0.00 8/16 Benchmark::DWF(int, int, double&) [13] | |
0.00 0.00 8/16 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
[113] 0.0 0.00 0.00 16 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [113] | |
0.00 0.00 192/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 16/52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
0.00 0.00 144/620 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) [151] | |
----------------------------------------------- | |
0.00 0.00 4/8 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 4/8 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
[114] 0.0 0.00 0.00 8 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [114] | |
0.00 0.00 96/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 8/52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
0.00 0.00 72/620 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) [151] | |
----------------------------------------------- | |
0.00 0.00 4/52 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.00 0.00 8/52 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [114] | |
0.00 0.00 8/52 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
0.00 0.00 16/52 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [67] | |
0.00 0.00 16/52 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [113] | |
[115] 0.0 0.00 0.00 52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
0.00 0.00 52/91 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [116] | |
0.00 0.00 52/52 Grid::CartesianCommunicator::InitFromMPICommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*) [119] | |
----------------------------------------------- | |
0.00 0.00 39/91 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
0.00 0.00 52/91 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
[116] 0.0 0.00 0.00 91 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [116] | |
0.00 0.00 91/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 91/127 Grid::SharedMemory::ShmBufferFreeAll() [160] | |
0.00 0.00 91/92 std::vector<void*, std::allocator<void*> >::_M_default_append(unsigned long) [164] | |
----------------------------------------------- | |
0.00 0.00 4/39 Grid::QCD::SpaceTimeGrid::makeFourDimDWFGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [118] | |
0.00 0.00 11/39 Benchmark::Memory() [49] | |
0.00 0.00 24/39 Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [112] | |
[117] 0.0 0.00 0.00 39 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
0.00 0.00 39/91 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [116] | |
0.00 0.00 39/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 39/39 Grid::GlobalSharedMemory::OptimalCommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*&) [179] | |
0.00 0.00 39/191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
----------------------------------------------- | |
0.00 0.00 4/4 Benchmark::DWF5(int, int) [17] | |
[118] 0.0 0.00 0.00 4 Grid::QCD::SpaceTimeGrid::makeFourDimDWFGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [118] | |
0.00 0.00 48/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 4/39 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
----------------------------------------------- | |
0.00 0.00 52/52 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [115] | |
[119] 0.0 0.00 0.00 52 Grid::CartesianCommunicator::InitFromMPICommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*) [119] | |
0.00 0.00 52/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 52/191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::CartesianCommunicator::Init(int*, char***) [121] | |
[120] 0.0 0.00 0.00 1 Grid::GlobalSharedMemory::Init(ompi_communicator_t*) [120] | |
0.00 0.00 2/32499663 std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) [22] | |
0.00 0.00 1/1 void std::__introsort_loop<__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> > >(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> >) [240] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[121] 0.0 0.00 0.00 1 Grid::CartesianCommunicator::Init(int*, char***) [121] | |
0.00 0.00 1/1 Grid::GlobalSharedMemory::Init(ompi_communicator_t*) [120] | |
0.00 0.00 1/2 Grid::Grid_quiesce_nodes() [215] | |
0.00 0.00 1/1 Grid::GlobalSharedMemory::SharedMemoryAllocate(unsigned long, int) [235] | |
----------------------------------------------- | |
<spontaneous> | |
[122] 0.0 0.00 0.00 Grid::Grid_init(int*, char***) [122] | |
0.00 0.00 1/1 Grid::CartesianCommunicator::Init(int*, char***) [121] | |
0.00 0.00 42/42 Grid::Grid_sa_signal_handler(int, siginfo_t*, void*) [178] | |
0.00 0.00 18/22 char** std::__find_if<char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const> >(char**, char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const>, std::random_access_iterator_tag) [194] | |
0.00 0.00 1/2 Grid::Grid_quiesce_nodes() [215] | |
0.00 0.00 1/1 Grid::CartesianCommunicator::RankWorld() [236] | |
0.00 0.00 1/1 Grid::printHash() [237] | |
0.00 0.00 1/1 Grid::GridCmdOptionCSL(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [232] | |
0.00 0.00 1/1 Grid::GridLogConfigure(std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [233] | |
0.00 0.00 1/1 Grid::GridParseLayout(char**, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [231] | |
0.00 0.00 1/1 Grid::operator<<(std::ostream&, Grid::Logger&) [clone .constprop.140] [238] | |
0.00 0.00 1/1 Grid::GridLogTimestamp(int) [234] | |
----------------------------------------------- | |
0.00 0.00 422144/1266432 void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) [46] | |
0.00 0.00 844288/1266432 void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) [35] | |
[130] 0.0 0.00 0.00 1266432 Grid::GridCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [130] | |
----------------------------------------------- | |
0.00 0.00 28032/112128 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/112128 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
0.00 0.00 56064/112128 void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [94] | |
[131] 0.0 0.00 0.00 112128 Grid::CartesianCommunicator::StencilBarrier() [131] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[132] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void>&, int, int&) [132] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[133] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void>&, int, int&) [133] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[134] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void>&, int, int&) [134] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[135] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void>&, int, int&) [135] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[136] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void>&, int, int&) [136] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[137] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void>&, int, int&) [137] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[138] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void>&, int, int&) [138] | |
----------------------------------------------- | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[139] 0.0 0.00 0.00 56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void>&, int, int&) [139] | |
----------------------------------------------- | |
0.00 0.00 8800/56064 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [109] | |
0.00 0.00 19232/56064 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [89] | |
0.00 0.00 28032/56064 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [95] | |
[140] 0.0 0.00 0.00 56064 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Prepare() [140] | |
----------------------------------------------- | |
0.00 0.00 38432/38432 Benchmark::DWF(int, int, double&) [13] | |
[141] 0.0 0.00 0.00 38432 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [141] | |
----------------------------------------------- | |
0.00 0.00 8800/28032 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [109] | |
0.00 0.00 19232/28032 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [89] | |
[142] 0.0 0.00 0.00 28032 void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [142] | |
0.00 0.00 28032/112128 Grid::CartesianCommunicator::StencilBarrier() [131] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void>&, int, int&) [134] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void>&, int, int&) [136] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void>&, int, int&) [138] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void>&, int, int&) [132] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void>&, int, int&) [135] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void>&, int, int&) [137] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void>&, int, int&) [139] | |
0.00 0.00 28032/56064 int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void>&, int, int&) [133] | |
----------------------------------------------- | |
0.00 0.00 17600/17600 Benchmark::DWF5(int, int) [17] | |
[143] 0.0 0.00 0.00 17600 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [143] | |
----------------------------------------------- | |
0.00 0.00 96/3206 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
0.00 0.00 128/3206 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) [54] | |
0.00 0.00 630/3206 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
0.00 0.00 840/3206 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [90] | |
0.00 0.00 1512/3206 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[144] 0.0 0.00 0.00 3206 Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [144] | |
----------------------------------------------- | |
0.00 0.00 3024/3024 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[145] 0.0 0.00 0.00 3024 Grid::GridRedBlackCartesian::CheckerBoardShiftForCB(int, int, int, int) [145] | |
----------------------------------------------- | |
0.00 0.00 12/2790 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int, int) [111] | |
0.00 0.00 16/2790 void Grid::Copy_plane_permute<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int, int) [91] | |
0.00 0.00 618/2790 void Grid::Copy_plane<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int) [107] | |
0.00 0.00 824/2790 void Grid::Copy_plane<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int) [110] | |
0.00 0.00 1320/2790 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[146] 0.0 0.00 0.00 2790 Grid::GridCartesian::CheckerBoarded(int) [146] | |
----------------------------------------------- | |
0.00 0.00 2640/2640 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[147] 0.0 0.00 0.00 2640 Grid::GridRedBlackCartesian::CheckerBoarded(int) [147] | |
----------------------------------------------- | |
0.00 0.00 12/1325 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>*, unsigned long) [197] | |
0.00 0.00 24/1325 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8>*, unsigned long) [191] | |
0.00 0.00 33/1325 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::deallocate(Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8>*, unsigned long) [185] | |
0.00 0.00 36/1325 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
0.00 0.00 36/1325 Grid::alignedAllocator<Grid::StencilEntry>::deallocate(Grid::StencilEntry*, unsigned long) [181] | |
0.00 0.00 72/1325 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::deallocate(Grid::Grid_simd<unsigned int, __Uint32x4_t>*, unsigned long) [170] | |
0.00 0.00 76/1325 Grid::alignedAllocator<std::complex<double> >::deallocate(std::complex<double>*, unsigned long) [166] | |
0.00 0.00 180/1325 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [158] | |
0.00 0.00 424/1325 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
0.00 0.00 432/1325 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >*, unsigned long) [152] | |
[148] 0.0 0.00 0.00 1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 12/1325 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::allocate(unsigned long, void const*) [87] | |
0.00 0.00 24/1325 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::allocate(unsigned long, void const*) [71] | |
0.00 0.00 33/1325 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::allocate(unsigned long, void const*) [78] | |
0.00 0.00 36/1325 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [66] | |
0.00 0.00 36/1325 Grid::alignedAllocator<Grid::StencilEntry>::allocate(unsigned long, void const*) [59] | |
0.00 0.00 72/1325 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::allocate(unsigned long, void const*) [171] | |
0.00 0.00 76/1325 Grid::alignedAllocator<std::complex<double> >::allocate(unsigned long, void const*) [167] | |
0.00 0.00 180/1325 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::allocate(unsigned long, void const*) [42] | |
0.00 0.00 424/1325 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [57] | |
0.00 0.00 432/1325 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::allocate(unsigned long, void const*) [153] | |
[149] 0.0 0.00 0.00 1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.00 16/672 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.00 0.00 32/672 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
0.00 0.00 624/672 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() [47] | |
[150] 0.0 0.00 0.00 672 Grid::CartesianCommunicator::GlobalSum(double&) [150] | |
----------------------------------------------- | |
0.00 0.00 12/620 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.00 0.00 24/620 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
0.00 0.00 72/620 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [114] | |
0.00 0.00 144/620 Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [113] | |
0.00 0.00 368/620 Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [50] | |
[151] 0.0 0.00 0.00 620 void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) [151] | |
----------------------------------------------- | |
0.00 0.00 432/432 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
[152] 0.0 0.00 0.00 432 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >*, unsigned long) [152] | |
0.00 0.00 432/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 432/432 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
[153] 0.0 0.00 0.00 432 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::allocate(unsigned long, void const*) [153] | |
0.00 0.00 432/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.00 4/424 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 52/424 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.00 0.00 112/424 Benchmark::DWF(int, int, double&) [13] | |
0.00 0.00 112/424 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
0.00 0.00 144/424 void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) [76] | |
[154] 0.0 0.00 0.00 424 Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [154] | |
0.00 0.00 424/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 48/224 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
0.00 0.00 48/224 Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) [84] | |
0.00 0.00 64/224 void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [90] | |
0.00 0.00 64/224 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) [54] | |
[155] 0.0 0.00 0.00 224 Grid::GridCartesian::CheckerBoardDestination(int, int, int) [155] | |
----------------------------------------------- | |
0.00 0.00 216/216 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[156] 0.0 0.00 0.00 216 Grid::SharedMemory::ShmBufferMalloc(unsigned long) [156] | |
----------------------------------------------- | |
0.00 0.00 4/191 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.00 0.00 8/191 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
0.00 0.00 16/191 Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [67] | |
0.00 0.00 39/191 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
0.00 0.00 52/191 Grid::CartesianCommunicator::InitFromMPICommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*) [119] | |
0.00 0.00 72/191 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[157] 0.0 0.00 0.00 191 std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) [157] | |
----------------------------------------------- | |
0.00 0.00 4/180 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() [209] | |
0.00 0.00 8/180 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() [202] | |
0.00 0.00 32/180 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 136/180 Benchmark::DWF(int, int, double&) [13] | |
[158] 0.0 0.00 0.00 180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [158] | |
0.00 0.00 180/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 48/144 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 96/144 Benchmark::DWF(int, int, double&) [13] | |
[159] 0.0 0.00 0.00 144 Grid::CartesianCommunicator::Barrier() [159] | |
----------------------------------------------- | |
0.00 0.00 36/127 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
0.00 0.00 91/127 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [116] | |
[160] 0.0 0.00 0.00 127 Grid::SharedMemory::ShmBufferFreeAll() [160] | |
----------------------------------------------- | |
0.00 0.00 120/120 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) [201] | |
[161] 0.0 0.00 0.00 120 std::vector<double, std::allocator<double> >::_M_default_append(unsigned long) [161] | |
----------------------------------------------- | |
0.00 0.00 120/120 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) [201] | |
[162] 0.0 0.00 0.00 120 std::vector<double, std::allocator<double> >::resize(unsigned long) [162] | |
----------------------------------------------- | |
0.00 0.00 32/104 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 72/104 Benchmark::DWF(int, int, double&) [13] | |
[163] 0.0 0.00 0.00 104 Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::~Lattice() [163] | |
----------------------------------------------- | |
0.00 0.00 1/92 Grid::GlobalSharedMemory::SharedMemoryAllocate(unsigned long, int) [235] | |
0.00 0.00 91/92 Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [116] | |
[164] 0.0 0.00 0.00 92 std::vector<void*, std::allocator<void*> >::_M_default_append(unsigned long) [164] | |
----------------------------------------------- | |
0.00 0.00 4/76 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 72/76 Benchmark::DWF(int, int, double&) [13] | |
[165] 0.0 0.00 0.00 76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
0.00 0.00 76/76 Grid::CartesianCommunicator::GlobalSumVector(double*, int) [168] | |
0.00 0.00 76/76 Grid::CartesianCommunicator::GlobalSum(std::complex<double>&) [169] | |
0.00 0.00 76/76 Grid::alignedAllocator<std::complex<double> >::deallocate(std::complex<double>*, unsigned long) [166] | |
0.00 0.00 76/76 Grid::alignedAllocator<std::complex<double> >::allocate(unsigned long, void const*) [167] | |
----------------------------------------------- | |
0.00 0.00 76/76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
[166] 0.0 0.00 0.00 76 Grid::alignedAllocator<std::complex<double> >::deallocate(std::complex<double>*, unsigned long) [166] | |
0.00 0.00 76/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 76/76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
[167] 0.0 0.00 0.00 76 Grid::alignedAllocator<std::complex<double> >::allocate(unsigned long, void const*) [167] | |
0.00 0.00 76/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.00 76/76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
[168] 0.0 0.00 0.00 76 Grid::CartesianCommunicator::GlobalSumVector(double*, int) [168] | |
----------------------------------------------- | |
0.00 0.00 76/76 std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [165] | |
[169] 0.0 0.00 0.00 76 Grid::CartesianCommunicator::GlobalSum(std::complex<double>&) [169] | |
----------------------------------------------- | |
0.00 0.00 72/72 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
[170] 0.0 0.00 0.00 72 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::deallocate(Grid::Grid_simd<unsigned int, __Uint32x4_t>*, unsigned long) [170] | |
0.00 0.00 72/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 72/72 Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [31] | |
[171] 0.0 0.00 0.00 72 Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::allocate(unsigned long, void const*) [171] | |
0.00 0.00 72/1325 Grid::PointerCache::Lookup(unsigned long) [149] | |
----------------------------------------------- | |
0.00 0.00 72/72 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [14] | |
[172] 0.0 0.00 0.00 72 std::vector<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, std::allocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*> >::_M_default_append(unsigned long) [172] | |
----------------------------------------------- | |
0.00 0.00 7/55 Benchmark::Decomposition() [81] | |
0.00 0.00 16/55 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 32/55 Benchmark::DWF(int, int, double&) [13] | |
[173] 0.0 0.00 0.00 55 Grid::GridCmdVectorIntToString[abi:cxx11](std::vector<int, std::allocator<int> > const&) [173] | |
----------------------------------------------- | |
0.00 0.00 16/48 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 32/48 Benchmark::DWF(int, int, double&) [13] | |
[174] 0.0 0.00 0.00 48 time_statistics::statistics(std::vector<double, std::allocator<double> >) [174] | |
----------------------------------------------- | |
0.00 0.00 48/48 void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [103] | |
[175] 0.0 0.00 0.00 48 Grid::GridBase::PermuteType(int) [175] | |
----------------------------------------------- | |
0.00 0.00 16/48 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [48] | |
0.00 0.00 32/48 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() [43] | |
[176] 0.0 0.00 0.00 48 std::vector<int, std::allocator<int> >::vector(std::vector<int, std::allocator<int> > const&) [176] | |
----------------------------------------------- | |
0.00 0.00 1/42 Benchmark::Decomposition() [81] | |
0.00 0.00 1/42 Benchmark::Memory() [49] | |
0.00 0.00 16/42 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 24/42 Benchmark::DWF(int, int, double&) [13] | |
[177] 0.0 0.00 0.00 42 Grid::GridDefaultMpi() [177] | |
----------------------------------------------- | |
0.00 0.00 42/42 Grid::Grid_init(int*, char***) [122] | |
[178] 0.0 0.00 0.00 42 Grid::Grid_sa_signal_handler(int, siginfo_t*, void*) [178] | |
----------------------------------------------- | |
0.00 0.00 39/39 Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [117] | |
[179] 0.0 0.00 0.00 39 Grid::GlobalSharedMemory::OptimalCommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*&) [179] | |
----------------------------------------------- | |
0.00 0.00 12/36 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() [209] | |
0.00 0.00 24/36 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() [202] | |
[180] 0.0 0.00 0.00 36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::~CartesianStencil() [180] | |
0.00 0.00 36/36 Grid::alignedAllocator<Grid::StencilEntry>::deallocate(Grid::StencilEntry*, unsigned long) [181] | |
----------------------------------------------- | |
0.00 0.00 36/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::~CartesianStencil() [180] | |
[181] 0.0 0.00 0.00 36 Grid::alignedAllocator<Grid::StencilEntry>::deallocate(Grid::StencilEntry*, unsigned long) [181] | |
0.00 0.00 36/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 4/36 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 4/36 Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [30] | |
0.00 0.00 4/36 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [29] | |
0.00 0.00 8/36 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [28] | |
0.00 0.00 16/36 Benchmark::DWF(int, int, double&) [13] | |
[182] 0.0 0.00 0.00 36 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [182] | |
0.00 0.00 36/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 12/36 Benchmark::Memory() [49] | |
0.00 0.00 24/36 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [104] | |
[183] 0.0 0.00 0.00 36 Grid::CartesianCommunicator::BroadcastWorld(int, void*, int) [183] | |
----------------------------------------------- | |
0.00 0.00 12/36 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 24/36 Benchmark::DWF(int, int, double&) [13] | |
[184] 0.0 0.00 0.00 36 void std::vector<double, std::allocator<double> >::_M_realloc_insert<double const&>(__gnu_cxx::__normal_iterator<double*, std::vector<double, std::allocator<double> > >, double const&) [184] | |
----------------------------------------------- | |
0.00 0.00 33/33 Benchmark::Memory() [49] | |
[185] 0.0 0.00 0.00 33 Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::deallocate(Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8>*, unsigned long) [185] | |
0.00 0.00 33/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 32/32 Benchmark::DWF(int, int, double&) [13] | |
[186] 0.0 0.00 0.00 32 Grid::CartesianCommunicator::Broadcast(int, void*, int) [186] | |
----------------------------------------------- | |
0.00 0.00 32/32 Benchmark::DWF(int, int, double&) [13] | |
[187] 0.0 0.00 0.00 32 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() [187] | |
----------------------------------------------- | |
0.00 0.00 32/32 Benchmark::DWF(int, int, double&) [13] | |
[188] 0.0 0.00 0.00 32 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopOE(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) [188] | |
----------------------------------------------- | |
0.00 0.00 1/31 Benchmark::Memory() [49] | |
0.00 0.00 6/31 Benchmark::Decomposition() [81] | |
0.00 0.00 8/31 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 16/31 Benchmark::DWF(int, int, double&) [13] | |
[189] 0.0 0.00 0.00 31 Grid::GridDefaultSimd(int, int) [189] | |
----------------------------------------------- | |
0.00 0.00 1/25 Benchmark::Memory() [49] | |
0.00 0.00 24/25 Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [104] | |
[190] 0.0 0.00 0.00 25 std::seed_seq::seed_seq<__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > > >(__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >) [190] | |
----------------------------------------------- | |
0.00 0.00 24/24 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() [202] | |
[191] 0.0 0.00 0.00 24 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8>*, unsigned long) [191] | |
0.00 0.00 24/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 23/23 Grid::CartesianCommunicator::~CartesianCommunicator() [193] | |
[192] 0.0 0.00 0.00 23 Grid::SharedMemory::~SharedMemory() [192] | |
----------------------------------------------- | |
0.00 0.00 4/23 Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [40] | |
0.00 0.00 8/23 Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [41] | |
0.00 0.00 11/23 Benchmark::Memory() [49] | |
[193] 0.0 0.00 0.00 23 Grid::CartesianCommunicator::~CartesianCommunicator() [193] | |
0.00 0.00 23/23 Grid::SharedMemory::~SharedMemory() [192] | |
----------------------------------------------- | |
0.00 0.00 4/22 Grid::GridParseLayout(char**, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [231] | |
0.00 0.00 18/22 Grid::Grid_init(int*, char***) [122] | |
[194] 0.0 0.00 0.00 22 char** std::__find_if<char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const> >(char**, char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const>, std::random_access_iterator_tag) [194] | |
----------------------------------------------- | |
0.00 0.00 8/16 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsTanh(Grid::Approx::zolotarev_data*, double, double) [200] | |
0.00 0.00 8/16 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) [201] | |
[195] 0.0 0.00 0.00 16 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooeeInternalCompute(int, int, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&) [195] | |
----------------------------------------------- | |
0.00 0.00 16/16 Benchmark::DWF5(int, int) [17] | |
[196] 0.0 0.00 0.00 16 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() [196] | |
----------------------------------------------- | |
0.00 0.00 12/12 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() [209] | |
[197] 0.0 0.00 0.00 12 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>*, unsigned long) [197] | |
0.00 0.00 12/1325 Grid::PointerCache::Insert(void*, unsigned long) [148] | |
----------------------------------------------- | |
0.00 0.00 4/12 Benchmark::DWF5(int, int) [17] | |
0.00 0.00 8/12 Benchmark::DWF(int, int, double&) [13] | |
[198] 0.0 0.00 0.00 12 std::vector<std::complex<float>, std::allocator<std::complex<float> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::complex<float>*, std::vector<std::complex<float>, std::allocator<std::complex<float> > > >, unsigned long, std::complex<float> const&) [198] | |
----------------------------------------------- | |
0.00 0.00 8/8 Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [16] | |
[199] 0.0 0.00 0.00 8 Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) [199] | |
----------------------------------------------- | |
0.00 0.00 8/8 Benchmark::DWF(int, int, double&) [13] | |
[200] 0.0 0.00 0.00 8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsTanh(Grid::Approx::zolotarev_data*, double, double) [200] | |
0.00 0.00 8/16 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooeeInternalCompute(int, int, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&) [195] | |
0.00 0.00 8/8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) [201] | |
----------------------------------------------- | |
0.00 0.00 8/8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsTanh(Grid::Approx::zolotarev_data*, double, double) [200] | |
[201] 0.0 0.00 0.00 8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) [201] | |
0.00 0.00 120/120 std::vector<double, std::allocator<double> >::_M_default_append(unsigned long) [161] | |
0.00 0.00 120/120 std::vector<double, std::allocator<double> >::resize(unsigned long) [162] | |
0.00 0.00 8/16 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooeeInternalCompute(int, int, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&) [195] | |
----------------------------------------------- | |
0.00 0.00 8/8 Benchmark::DWF(int, int, double&) [13] | |
[202] 0.0 0.00 0.00 8 Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() [202] | |
0.00 0.00 24/24 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8>*, unsigned long) [191] | |
0.00 0.00 24/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::~CartesianStencil() [180] | |
0.00 0.00 8/180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [158] | |
----------------------------------------------- | |
0.00 0.00 8/8 Benchmark::DWF(int, int, double&) [13] | |
[203] 0.0 0.00 0.00 8 Grid::Approx::zolotarev_free(Grid::Approx::zolotarev_data*) [203] | |
----------------------------------------------- | |
0.00 0.00 8/8 Benchmark::DWF(int, int, double&) [13] | |
[204] 0.0 0.00 0.00 8 Grid::Approx::higham(double, int) [204] | |
0.00 0.00 8/8 Grid::Approx::construct_partfrac(Grid::Approx::izd*) [206] | |
0.00 0.00 8/8 Grid::Approx::construct_contfrac(Grid::Approx::izd*) [205] | |
----------------------------------------------- | |
0.00 0.00 8/8 Grid::Approx::higham(double, int) [204] | |
[205] 0.0 0.00 0.00 8 Grid::Approx::construct_contfrac(Grid::Approx::izd*) [205] | |
0.00 0.00 4/4 Grid::Approx::contfrac_A(double*, double*, double*, double*, int, int) [210] | |
----------------------------------------------- | |
0.00 0.00 8/8 Grid::Approx::higham(double, int) [204] | |
[206] 0.0 0.00 0.00 8 Grid::Approx::construct_partfrac(Grid::Approx::izd*) [206] | |
----------------------------------------------- | |
0.00 0.00 4/4 __libc_csu_init [3738] | |
[207] 0.0 0.00 0.00 4 _GLOBAL__sub_I__ZN4Grid3QCD13SpaceTimeGrid15makeFourDimGridERKSt6vectorIiSaIiEES6_S6_ [207] | |
----------------------------------------------- | |
0.00 0.00 4/4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) [19] | |
[208] 0.0 0.00 0.00 4 Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) [208] | |
----------------------------------------------- | |
0.00 0.00 4/4 Benchmark::DWF5(int, int) [17] | |
[209] 0.0 0.00 0.00 4 Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() [209] | |
0.00 0.00 12/12 Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>*, unsigned long) [197] | |
0.00 0.00 12/36 Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::~CartesianStencil() [180] | |
0.00 0.00 4/180 Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [158] | |
----------------------------------------------- | |
28 Grid::Approx::contfrac_A(double*, double*, double*, double*, int, int) [210] | |
0.00 0.00 4/4 Grid::Approx::construct_contfrac(Grid::Approx::izd*) [205] | |
[210] 0.0 0.00 0.00 4+28 Grid::Approx::contfrac_A(double*, double*, double*, double*, int, int) [210] | |
28 Grid::Approx::contfrac_A(double*, double*, double*, double*, int, int) [210] | |
----------------------------------------------- | |
0.00 0.00 3/3 Grid::GridCmdOptionCSL(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [232] | |
[211] 0.0 0.00 0.00 3 void std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >::_M_realloc_insert<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&>(__gnu_cxx::__normal_iterator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >*, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) [211] | |
----------------------------------------------- | |
0.00 0.00 3/3 Grid::Colours::~Colours() [3543] | |
[212] 0.0 0.00 0.00 3 std::_Rb_tree<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::_Select1st<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >, std::less<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::allocator<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >::_M_erase(std::_Rb_tree_node<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >*) [212] | |
----------------------------------------------- | |
0.00 0.00 2/2 __libc_csu_init [3738] | |
[213] 0.0 0.00 0.00 2 _GLOBAL__sub_I__ZN4Grid3QCD22StaggeredKernelsStatic3OptE [213] | |
----------------------------------------------- | |
0.00 0.00 2/2 __libc_csu_init [3738] | |
[214] 0.0 0.00 0.00 2 _GLOBAL__sub_I__ZN4Grid3QCD5Gamma3gmuE [214] | |
----------------------------------------------- | |
0.00 0.00 1/2 Grid::Grid_init(int*, char***) [122] | |
0.00 0.00 1/2 Grid::CartesianCommunicator::Init(int*, char***) [121] | |
[215] 0.0 0.00 0.00 2 Grid::Grid_quiesce_nodes() [215] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[216] 0.0 0.00 0.00 1 _GLOBAL__sub_I_L_list [216] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[217] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid10GridThread8_threadsE [217] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[218] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid13LebesgueOrder16UseLebesgueOrderE [218] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[219] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid14MemoryProfiler5statsE [219] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[220] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid18GlobalSharedMemory17MAX_MPI_SHM_BYTESE [220] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[221] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid18GlobalSharedMemory4InitEP19ompi_communicator_t [221] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[222] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid21CartesianCommunicator18CommunicatorPolicyE [222] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[223] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid21CartesianCommunicator18communicator_worldE [223] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[224] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid26Gather_plane_table_computeEPNS_8GridBaseEiiiiRSt6vectorISt4pairIiiESaIS4_EE [224] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[225] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid3QCD13WilsonKernelsINS0_17GparityWilsonImplINS_9Grid_simdISt7complexIfE13__Float32x4_tEENS0_14FundamentalRepILi3EEENS0_9CoeffRealEEEE12HandDhopSiteERNS0_13WilsonStencilINS_7iVectorINSE_INSE_IS7_Li3EEELi4EEELi2EEENSE_INSE_ISF_Li2EEELi2EEEEERNS_13LebesgueOrderERNS_7LatticeINSE_INSE_INS_7iScalarINS_7iMatrixIS7_Li3EEEEELi8EEELi2EEEEEPSJ_iiRKNSO_ISH_EERSY_ [225] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[226] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid3QCD19WilsonKernelsStatic3OptE [226] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[227] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid3QCD21WilsonFermion5DStatic10directionsE [227] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[228] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid8demangleB5cxx11EPKc [228] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[229] 0.0 0.00 0.00 1 _GLOBAL__sub_I__ZN4Grid9printHashEv [229] | |
----------------------------------------------- | |
0.00 0.00 1/1 __libc_csu_init [3738] | |
[230] 0.0 0.00 0.00 1 __static_initialization_and_destruction_0(int, int) [clone .constprop.58] [230] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[231] 0.0 0.00 0.00 1 Grid::GridParseLayout(char**, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [231] | |
0.00 0.00 4/22 char** std::__find_if<char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const> >(char**, char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const>, std::random_access_iterator_tag) [194] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[232] 0.0 0.00 0.00 1 Grid::GridCmdOptionCSL(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [232] | |
0.00 0.00 3/3 void std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >::_M_realloc_insert<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&>(__gnu_cxx::__normal_iterator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >*, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) [211] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[233] 0.0 0.00 0.00 1 Grid::GridLogConfigure(std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [233] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[234] 0.0 0.00 0.00 1 Grid::GridLogTimestamp(int) [234] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::CartesianCommunicator::Init(int*, char***) [121] | |
[235] 0.0 0.00 0.00 1 Grid::GlobalSharedMemory::SharedMemoryAllocate(unsigned long, int) [235] | |
0.00 0.00 1/92 std::vector<void*, std::allocator<void*> >::_M_default_append(unsigned long) [164] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[236] 0.0 0.00 0.00 1 Grid::CartesianCommunicator::RankWorld() [236] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[237] 0.0 0.00 0.00 1 Grid::printHash() [237] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_init(int*, char***) [122] | |
[238] 0.0 0.00 0.00 1 Grid::operator<<(std::ostream&, Grid::Logger&) [clone .constprop.140] [238] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::Grid_unquiesce_nodes() [631] | |
[239] 0.0 0.00 0.00 1 std::_Rb_tree<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::_Select1st<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >, std::less<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::allocator<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >::_M_get_insert_unique_pos(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) [239] | |
----------------------------------------------- | |
0.00 0.00 1/1 Grid::GlobalSharedMemory::Init(ompi_communicator_t*) [120] | |
[240] 0.0 0.00 0.00 1 void std::__introsort_loop<__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> > >(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> >) [240] | |
----------------------------------------------- | |
This table describes the call tree of the program, and was sorted by | |
the total amount of time spent in each function and its children. | |
Each entry in this table consists of several lines. The line with the | |
index number at the left hand margin lists the current function. | |
The lines above it list the functions that called this function, | |
and the lines below it list the functions this one called. | |
For the current function's line, the fields have the following meanings: | |
index A unique number given to each element of the table. | |
Index numbers are sorted numerically. | |
The index number is printed next to every function name so | |
it is easier to look up where the function is in the table. | |
% time This is the percentage of the 'total' time that was spent | |
in this function and its children. Note that due to | |
different viewpoints, functions excluded by options, etc., | |
these numbers will NOT add up to 100%. | |
self This is the total amount of time spent in this function. | |
children This is the total amount of time propagated into this | |
function by its children. | |
called This is the number of times the function was called. | |
If the function called itself recursively, the number | |
only includes non-recursive calls, and is followed by | |
a `+' and the number of recursive calls. | |
name The name of the current function. The index number is | |
printed after it. If the function is a member of a | |
cycle, the cycle number is printed between the | |
function's name and the index number. | |
For the function's parents, the fields have the following meanings: | |
self This is the amount of time that was propagated directly | |
from the function into this parent. | |
children This is the amount of time that was propagated from | |
the function's children into this parent. | |
called This is the number of times this parent called the | |
function `/' the total number of times the function | |
was called. Recursive calls to the function are not | |
included in the number after the `/'. | |
name This is the name of the parent. The parent's index | |
number is printed after it. If the parent is a | |
member of a cycle, the cycle number is printed between | |
the name and the index number. | |
If the parents of the function cannot be determined, the word | |
`<spontaneous>' is printed in the `name' field, and all the other | |
fields are blank. | |
For the function's children, the fields have the following meanings: | |
self This is the amount of time that was propagated directly | |
from the child into the function. | |
children This is the amount of time that was propagated from the | |
child's children to the function. | |
called This is the number of times the function called | |
this child `/' the total number of times the child | |
was called. Recursive calls by the child are not | |
listed in the number after the `/'. | |
name This is the name of the child. The child's index | |
number is printed after it. If the child is a | |
member of a cycle, the cycle number is printed | |
between the name and the index number. | |
If there are any cycles (circles) in the call graph, there is an | |
entry for the cycle-as-a-whole. This entry shows who called the | |
cycle (as parents) and the members of the cycle (as children.) | |
The `+' recursive calls entry shows the number of function calls that | |
were internal to the cycle, and the calls entry for each member shows, | |
for that member, how many times it was called from other members of | |
the cycle. | |
Copyright (C) 2012-2015 Free Software Foundation, Inc. | |
Copying and distribution of this file, with or without modification, | |
are permitted in any medium without royalty provided the copyright | |
notice and this notice are preserved. | |
Index by function name | |
[216] _GLOBAL__sub_I_L_list [191] Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8>*, unsigned long) [20] Grid::QCD::FermionOperator<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::RedBlackGrid() | |
[217] _GLOBAL__sub_I__ZN4Grid10GridThread8_threadsE [71] Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::allocate(unsigned long, void const*) [25] Grid::QCD::FermionOperator<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooDeriv(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int) | |
[218] _GLOBAL__sub_I__ZN4Grid13LebesgueOrder16UseLebesgueOrderE [197] Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>*, unsigned long) [28] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
[219] _GLOBAL__sub_I__ZN4Grid14MemoryProfiler5statsE [87] Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::allocate(unsigned long, void const*) [83] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[220] _GLOBAL__sub_I__ZN4Grid18GlobalSharedMemory17MAX_MPI_SHM_BYTESE [185] Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::deallocate(Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8>*, unsigned long) [187] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() | |
[221] _GLOBAL__sub_I__ZN4Grid18GlobalSharedMemory4InitEP19ompi_communicator_t [78] Grid::alignedAllocator<Grid::iVector<Grid::Grid_simd<float, __Float32x4_t>, 8> >::allocate(unsigned long, void const*) [100] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[222] _GLOBAL__sub_I__ZN4Grid21CartesianCommunicator18CommunicatorPolicyE [170] Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::deallocate(Grid::Grid_simd<unsigned int, __Uint32x4_t>*, unsigned long) [89] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[223] _GLOBAL__sub_I__ZN4Grid21CartesianCommunicator18communicator_worldE [171] Grid::alignedAllocator<Grid::Grid_simd<unsigned int, __Uint32x4_t> >::allocate(unsigned long, void const*) [141] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[224] _GLOBAL__sub_I__ZN4Grid26Gather_plane_table_computeEPNS_8GridBaseEiiiiRSt6vectorISt4pairIiiESaIS4_EE [166] Grid::alignedAllocator<std::complex<double> >::deallocate(std::complex<double>*, unsigned long) [188] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopOE(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[207] _GLOBAL__sub_I__ZN4Grid3QCD13SpaceTimeGrid15makeFourDimGridERKSt6vectorIiSaIiEES6_S6_ [167] Grid::alignedAllocator<std::complex<double> >::allocate(unsigned long, void const*) [43] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() | |
[225] _GLOBAL__sub_I__ZN4Grid3QCD13WilsonKernelsINS0_17GparityWilsonImplINS_9Grid_simdISt7complexIfE13__Float32x4_tEENS0_14FundamentalRepILi3EEENS0_9CoeffRealEEEE12HandDhopSiteERNS0_13WilsonStencilINS_7iVectorINSE_INSE_IS7_Li3EEELi4EEELi2EEENSE_INSE_ISF_Li2EEELi2EEEEERNS_13LebesgueOrderERNS_7LatticeINSE_INSE_INS_7iScalarINS_7iMatrixIS7_Li3EEEEELi8EEELi2EEEEEPSJ_iiRKNSO_ISH_EERSY_ [32] void Grid::LatticeCoordinate<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >(Grid::Lattice<Grid::iScalar<Grid::Grid_simd<unsigned int, __Uint32x4_t> > >&, int) [16] Grid::QCD::WilsonFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) | |
[226] _GLOBAL__sub_I__ZN4Grid3QCD19WilsonKernelsStatic3OptE [111] void Grid::Copy_plane_permute<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int, int) [2] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::Mdir(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&, int, int) | |
[227] _GLOBAL__sub_I__ZN4Grid3QCD21WilsonFermion5DStatic10directionsE [91] void Grid::Copy_plane_permute<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int, int) [3] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) | |
[213] _GLOBAL__sub_I__ZN4Grid3QCD22StaggeredKernelsStatic3OptE [179] Grid::GlobalSharedMemory::OptimalCommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*&) [29] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ImportGauge(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
[214] _GLOBAL__sub_I__ZN4Grid3QCD5Gamma3gmuE [235] Grid::GlobalSharedMemory::SharedMemoryAllocate(unsigned long, int) [101] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternal(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[228] _GLOBAL__sub_I__ZN4Grid8demangleB5cxx11EPKc [120] Grid::GlobalSharedMemory::Init(ompi_communicator_t*) [196] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::ZeroCounters() | |
[229] _GLOBAL__sub_I__ZN4Grid9printHashEv [215] Grid::Grid_quiesce_nodes() [108] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalSerialComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[230] __static_initialization_and_destruction_0(int, int) [clone .constprop.58] [97] Grid::CartesianCommunicator::ShiftedRanks(int, int, int&, int&) [109] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopInternalOverlappedComms(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[174] time_statistics::statistics(std::vector<double, std::allocator<double> >) [183] Grid::CartesianCommunicator::BroadcastWorld(int, void*, int) [143] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopEO(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int) | |
[85] Grid::Grid_simd<unsigned int, __Uint32x4_t> Grid::Comparison<Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t>, 0>(Grid::seq<unsigned int, unsigned int>, Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::Grid_simd<unsigned int, __Uint32x4_t>::scalar_type const&) [131] Grid::CartesianCommunicator::StencilBarrier() [48] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::Report() | |
[107] void Grid::Copy_plane<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int, int) [168] Grid::CartesianCommunicator::GlobalSumVector(double*, int) [19] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, Grid::QCD::WilsonImplParams const&) | |
[110] void Grid::Copy_plane<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int, int) [61] Grid::CartesianCommunicator::ProcessorCoorFromRank(int, std::vector<int, std::allocator<int> >&) [209] Grid::QCD::WilsonFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~WilsonFermion5D() | |
[27] Grid::GridRNGbase::~GridRNGbase() [93] Grid::CartesianCommunicator::RankFromProcessorCoor(std::vector<int, std::allocator<int> >&) [12] Grid::QCD::DomainWallFermion<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MomentumSpacePropagator(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, double) | |
[103] void Grid::Cshift_local<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int, int) [119] Grid::CartesianCommunicator::InitFromMPICommunicator(std::vector<int, std::allocator<int> > const&, ompi_communicator_t*) [30] Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) | |
[90] void Grid::Cshift_local<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int, int) [121] Grid::CartesianCommunicator::Init(int*, char***) [76] void Grid::QCD::SU<3>::LieRandomize<Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > >(Grid::GridParallelRNG&, Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >&, double) | |
[148] Grid::PointerCache::Insert(void*, unsigned long) [159] Grid::CartesianCommunicator::Barrier() [26] std::enable_if<Grid::matchGridTensorIndex<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4>, 2>::value, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >::type Grid::QCD::operator*<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >(Grid::QCD::Gamma const&, Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> const&) | |
[149] Grid::PointerCache::Lookup(unsigned long) [98] Grid::CartesianCommunicator::BossRank() [203] Grid::Approx::zolotarev_free(Grid::Approx::zolotarev_data*) | |
[116] Grid::SharedMemory::SetCommunicator(ompi_communicator_t*) [92] Grid::CartesianCommunicator::ThisRank() [204] Grid::Approx::higham(double, int) | |
[156] Grid::SharedMemory::ShmBufferMalloc(unsigned long) [186] Grid::CartesianCommunicator::Broadcast(int, void*, int) [210] Grid::Approx::contfrac_A(double*, double*, double*, double*, int, int) | |
[160] Grid::SharedMemory::ShmBufferFreeAll() [169] Grid::CartesianCommunicator::GlobalSum(std::complex<double>&) [205] Grid::Approx::construct_contfrac(Grid::Approx::izd*) | |
[192] Grid::SharedMemory::~SharedMemory() [150] Grid::CartesianCommunicator::GlobalSum(double&) [206] Grid::Approx::construct_partfrac(Grid::Approx::izd*) | |
[165] std::complex<double> Grid::innerProduct<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&) [236] Grid::CartesianCommunicator::RankWorld() [84] Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > Grid::Cshift<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >(Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > > const&, int, int) | |
[130] Grid::GridCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [115] Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&, Grid::CartesianCommunicator const&, int&) [54] Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > Grid::Cshift<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, int, int) | |
[146] Grid::GridCartesian::CheckerBoarded(int) [117] Grid::CartesianCommunicator::CartesianCommunicator(std::vector<int, std::allocator<int> > const&) [102] Grid::Lattice<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::Lattice(Grid::GridBase*) | |
[144] Grid::GridCartesian::CheckerBoardShiftForCB(int, int, int, int) [193] Grid::CartesianCommunicator::~CartesianCommunicator() [45] Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::Lattice(Grid::GridBase*) | |
[155] Grid::GridCartesian::CheckerBoardDestination(int, int, int) [63] Grid::GridRedBlackCartesian::CheckerBoard(std::vector<int, std::allocator<int> > const&) [163] Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::~Lattice() | |
[52] Grid::LebesgueOrder::CartesianBlocking() [147] Grid::GridRedBlackCartesian::CheckerBoarded(int) [72] Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >::Lattice(Grid::GridBase*) | |
[50] Grid::LebesgueOrder::IterateI(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [18] Grid::GridRedBlackCartesian::CheckerBoardFromOindex(int) [88] Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >::Lattice(Grid::GridBase*) | |
[51] Grid::LebesgueOrder::IterateO(int, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [145] Grid::GridRedBlackCartesian::CheckerBoardShiftForCB(int, int, int, int) [21] Grid::permute(Grid::Grid_simd<std::complex<float>, __Float32x4_t>&, Grid::Grid_simd<std::complex<float>, __Float32x4_t>, int) | |
[53] Grid::LebesgueOrder::LebesgueOrder(Grid::GridBase*) [62] Grid::GridRedBlackCartesian::oIndex(std::vector<int, std::allocator<int> >&) [175] Grid::GridBase::PermuteType(int) | |
[35] void Grid::peekLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 4>&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&, std::vector<int, std::allocator<int> >&) [105] Grid::GridRedBlackCartesian::~GridRedBlackCartesian() [55] Grid::GridBase::iIndex(std::vector<int, std::allocator<int> >&) | |
[46] void Grid::pokeLocalSite<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8>, Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >(Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> const&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, std::vector<int, std::allocator<int> >&) [178] Grid::Grid_sa_signal_handler(int, siginfo_t*, void*) [56] Grid::GridBase::oIndex(std::vector<int, std::allocator<int> >&) | |
[177] Grid::GridDefaultMpi() [173] Grid::GridCmdVectorIntToString[abi:cxx11](std::vector<int, std::allocator<int> > const&) [237] Grid::printHash() | |
[189] Grid::GridDefaultSimd(int, int) [73] Grid::Gather_plane_table_compute(Grid::GridBase*, int, int, int, int, std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >&) [238] Grid::operator<<(std::ostream&, Grid::Logger&) [clone .constprop.140] | |
[104] Grid::GridParallelRNG::SeedFixedIntegers(std::vector<int, std::allocator<int> > const&) [31] Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal>::DoubleStore(Grid::GridBase*, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> > const&) [64] sitmo::prng_engine::encrypt_counter() | |
[33] Grid::GridParallelRNG::GridParallelRNG(Grid::GridBase*) [113] Grid::QCD::SpaceTimeGrid::makeFiveDimGrid(int, Grid::GridCartesian const*) [13] Benchmark::DWF(int, int, double&) | |
[231] Grid::GridParseLayout(char**, int, std::vector<int, std::allocator<int> >&, std::vector<int, std::allocator<int> >&) [112] Grid::QCD::SpaceTimeGrid::makeFourDimGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [49] Benchmark::Memory() | |
[65] Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const Grid::predicatedWhere<Grid::Grid_simd<unsigned int, __Uint32x4_t> const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const>(Grid::Grid_simd<unsigned int, __Uint32x4_t> const& const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&, Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > const&) [114] Grid::QCD::SpaceTimeGrid::makeFiveDimDWFGrid(int, Grid::GridCartesian const*) [106] std::ctype<char>::do_widen(char) const | |
[86] void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMerge<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Merge> >&, std::vector<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress, std::allocator<Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, 
Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Decompress> >&) [118] Grid::QCD::SpaceTimeGrid::makeFourDimDWFGrid(std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [60] std::vector<Grid::StencilEntry, Grid::alignedAllocator<Grid::StencilEntry> >::_M_default_append(unsigned long) | |
[94] void Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommsMergeSHM<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>) [41] Grid::QCD::SpaceTimeGrid::makeFiveDimRedBlackGrid(int, Grid::GridCartesian const*) [211] void std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >::_M_realloc_insert<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&>(__gnu_cxx::__normal_iterator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >*, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) | |
[132] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTmProjector, void>&, int, int&) [67] Grid::QCD::SpaceTimeGrid::makeFourDimRedBlackGrid(Grid::GridCartesian const*) [172] std::vector<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, std::allocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*> >::_M_default_append(unsigned long) | |
[133] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonTpProjector, void>&, int, int&) [40] Grid::QCD::SpaceTimeGrid::makeFiveDimDWFRedBlackGrid(int, Grid::GridCartesian const*) [164] std::vector<void*, std::allocator<void*> >::_M_default_append(unsigned long) | |
[134] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXmProjector, void>&, int, int&) [44] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::TwoIndexRep<3, (Grid::QCD::TwoIndexSymmetry)1>, Grid::QCD::CoeffReal> >::ContractConservedCurrentSiteBwd(Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> > const&, Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> > const&, Grid::iScalar<Grid::iMatrix<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6>, 4> >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 6> >, 8> >&, unsigned int, unsigned int, bool) [99] std::vector<std::vector<ompi_request_t*, std::allocator<ompi_request_t*> >, 
std::allocator<std::vector<ompi_request_t*, std::allocator<ompi_request_t*> > > >::~vector() | |
[135] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonXpProjector, void>&, int, int&) [74] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplex> >::HandDhopSiteDagExt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > > const&, 
Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<double>, __Float64x2_t>, 3>, 4> > >&) [58] std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::normal_distribution<double>*, std::vector<std::normal_distribution<double>, std::allocator<std::normal_distribution<double> > > >, unsigned long, std::normal_distribution<double> const&) | |
[136] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYmProjector, void>&, int, int&) [75] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::TwoIndexRep<3, (Grid::QCD::TwoIndexSymmetry)-1>, Grid::QCD::CoeffReal> >::DhopDir(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, 
Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int, int) [34] std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::discrete_distribution<int>*, std::vector<std::discrete_distribution<int>, std::allocator<std::discrete_distribution<int> > > >, unsigned long, std::discrete_distribution<int> const&) | |
[137] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonYpProjector, void>&, int, int&) [9] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, 
Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [70] std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_int_distribution<unsigned int>*, std::vector<std::uniform_int_distribution<unsigned int>, std::allocator<std::uniform_int_distribution<unsigned int> > > >, unsigned long, std::uniform_int_distribution<unsigned int> const&) | |
[138] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZmProjector, void>&, int, int&) [8] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, 
Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [79] std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::uniform_real_distribution<double>*, std::vector<std::uniform_real_distribution<double>, std::allocator<std::uniform_real_distribution<double> > > >, unsigned long, std::uniform_real_distribution<double> const&) | |
[139] int Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherDir<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonZpProjector, void>&, int, int&) [80] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteDag(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, 
Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [96] std::vector<std::pair<int, int>, std::allocator<std::pair<int, int> > >::_M_default_append(unsigned long) | |
[36] Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::BuildSurfaceList(int, int) [7] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [198] std::vector<std::complex<float>, std::allocator<std::complex<float> > >::_M_fill_insert(__gnu_cxx::__normal_iterator<std::complex<float>*, std::vector<std::complex<float>, std::allocator<std::complex<float> > > >, unsigned long, std::complex<float> const&) | |
[1] Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CommunicateThreaded() [4] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [161] std::vector<double, std::allocator<double> >::_M_default_append(unsigned long) | |
[47] Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Report() [199] Grid::QCD::WilsonKernels<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) [184] void std::vector<double, std::allocator<double> >::_M_realloc_insert<double const&>(__gnu_cxx::__normal_iterator<double*, std::vector<double, std::allocator<double> > >, double const&) | |
[140] Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Prepare() [11] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [162] std::vector<double, std::allocator<double> >::resize(unsigned long) | |
[14] Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::CartesianStencil(Grid::GridBase*, int, int, std::vector<int, std::allocator<int> > const&, std::vector<int, std::allocator<int> > const&) [5] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSite(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [22] std::vector<int, std::allocator<int> >::_M_default_append(unsigned long) | |
[180] Grid::CartesianStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::~CartesianStencil() [68] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteDag(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [151] void std::vector<int, std::allocator<int> >::_M_realloc_insert<int const&>(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, int const&) | |
[232] Grid::GridCmdOptionCSL(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [10] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::HandDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [176] std::vector<int, std::allocator<int> >::vector(std::vector<int, std::allocator<int> > const&) | |
[233] Grid::GridLogConfigure(std::vector<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::allocator<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >&) [6] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::GenericDhopSiteInt(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::LebesgueOrder&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&) [157] std::vector<int, std::allocator<int> >::operator=(std::vector<int, std::allocator<int> > const&) | |
[234] Grid::GridLogTimestamp(int) [82] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::DhopDir(Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >&, Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<std::complex<float>, 3> >, 8> >&, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >*, int, int, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, int, int) [239] std::_Rb_tree<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::_Select1st<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >, std::less<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::allocator<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >::_M_get_insert_unique_pos(std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const&) | |
[181] Grid::alignedAllocator<Grid::StencilEntry>::deallocate(Grid::StencilEntry*, unsigned long) [208] Grid::QCD::WilsonKernels<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::WilsonKernels(Grid::QCD::WilsonImplParams const&) [212] std::_Rb_tree<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> >, std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::_Select1st<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >, std::less<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > >, std::allocator<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > > >::_M_erase(std::_Rb_tree_node<std::pair<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const, std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > > >*) | |
[59] Grid::alignedAllocator<Grid::StencilEntry>::allocate(unsigned long, void const*) [142] void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloGatherOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [190] std::seed_seq::seed_seq<__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > > >(__gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int const*, std::vector<int, std::allocator<int> > >) | |
[152] Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >*, unsigned long) [95] void Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::HaloExchangeOpt<Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void> >(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::QCD::WilsonCompressorTemplate<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::QCD::WilsonProjector, void>&) [240] void std::__introsort_loop<__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> > >(__gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, __gnu_cxx::__normal_iterator<int*, std::vector<int, std::allocator<int> > >, long, __gnu_cxx::__ops::_Iter_comp_iter<std::less<int> >) | |
[153] Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > >::allocate(unsigned long, void const*) [77] Grid::QCD::WilsonStencil<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >, Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 2> > >::Reporti(int) [194] char** std::__find_if<char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const> >(char**, char**, __gnu_cxx::__ops::_Iter_equals_val<std::__cxx11::basic_string<char, std::char_traits<char>, std::allocator<char> > const>, std::random_access_iterator_tag) | |
[154] Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::deallocate(Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > >*, unsigned long) [200] Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsTanh(Grid::Approx::zolotarev_data*, double, double) [69] __divdc3 | |
[57] Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> > > >::allocate(unsigned long, void const*) [195] Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::MooeeInternalCompute(int, int, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&, std::vector<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > >, Grid::alignedAllocator<Grid::iScalar<Grid::iScalar<Grid::iScalar<Grid::Grid_simd<std::complex<float>, __Float32x4_t> > > > > >&) [39] __extenddftf2 | |
[158] Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::deallocate(Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> >*, unsigned long) [201] Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::SetCoefficientsInternal(double, std::vector<double, std::allocator<double> >&, double, double) [24] __multf3 | |
[42] Grid::alignedAllocator<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >::allocate(unsigned long, void const*) [15] Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::CayleyFermion5D(Grid::Lattice<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, Grid::GridCartesian&, Grid::GridRedBlackCartesian&, double, double, Grid::QCD::WilsonImplParams const&) [37] __trunctfdf2 | |
[182] Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::deallocate(Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4>*, unsigned long) [202] Grid::QCD::CayleyFermion5D<Grid::QCD::WilsonImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffReal> >::~CayleyFermion5D() [23] frame_dummy | |
[66] Grid::alignedAllocator<Grid::iVector<Grid::iScalar<Grid::iMatrix<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3> >, 4> >::allocate(unsigned long, void const*) [38] Grid::QCD::CayleyFermion5D<Grid::QCD::DomainWallVec5dImpl<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, Grid::QCD::FundamentalRep<3>, Grid::QCD::CoeffComplexHalfComms> >::M5D(Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > > const&, Grid::Lattice<Grid::iScalar<Grid::iVector<Grid::iVector<Grid::Grid_simd<std::complex<float>, __Float32x4_t>, 3>, 4> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&, std::vector<std::complex<double>, std::allocator<std::complex<double> > >&) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment