//@HEADER // ************************************************************************ // // Kokkos v. 4.0 // Copyright (2022) National Technology & Engineering // Solutions of Sandia, LLC (NTESS). // // Under the terms of Contract DE-NA0003525 with NTESS, // the U.S. Government retains certain rights in this software. // // Part of Kokkos, under the Apache License v2.0 with LLVM Exceptions. // See https://kokkos.org/LICENSE for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //@HEADER #include namespace Test { namespace stdalgos { namespace TeamCopyIf { namespace KE = Kokkos::Experimental; template struct GreaterThanValueFunctor { ValueType m_val; KOKKOS_INLINE_FUNCTION GreaterThanValueFunctor(ValueType val) : m_val(val) {} KOKKOS_INLINE_FUNCTION bool operator()(ValueType val) const { return (val > m_val); } }; template struct TestFunctorA { SourceViewType m_sourceView; DestViewType m_destView; DistancesViewType m_distancesView; IntraTeamSentinelView m_intraTeamSentinelView; ValueType m_threshold; int m_apiPick; TestFunctorA(const SourceViewType sourceView, const DestViewType destView, const DistancesViewType distancesView, const IntraTeamSentinelView intraTeamSentinelView, ValueType threshold, int apiPick) : m_sourceView(sourceView), m_destView(destView), m_distancesView(distancesView), m_intraTeamSentinelView(intraTeamSentinelView), m_threshold(threshold), m_apiPick(apiPick) {} template KOKKOS_INLINE_FUNCTION void operator()(const MemberType& member) const { const auto myRowIndex = member.league_rank(); auto myRowViewFrom = Kokkos::subview(m_sourceView, myRowIndex, Kokkos::ALL()); auto myRowViewDest = Kokkos::subview(m_destView, myRowIndex, Kokkos::ALL()); GreaterThanValueFunctor predicate(m_threshold); ptrdiff_t resultDist = 0; if (m_apiPick == 0) { auto it = KE::copy_if(member, KE::begin(myRowViewFrom), KE::end(myRowViewFrom), KE::begin(myRowViewDest), predicate); resultDist = KE::distance(KE::begin(myRowViewDest), it); Kokkos::single(Kokkos::PerTeam(member), [=, *this]() { m_distancesView(myRowIndex) = resultDist; }); } else if (m_apiPick == 1) { auto it = KE::copy_if(member, myRowViewFrom, myRowViewDest, predicate); resultDist = KE::distance(KE::begin(myRowViewDest), it); Kokkos::single(Kokkos::PerTeam(member), [=, *this]() { m_distancesView(myRowIndex) = resultDist; }); } // store result of checking if all members have their local // values matching the one stored in m_distancesView member.team_barrier(); const bool intraTeamCheck = team_members_have_matching_result( member, resultDist, m_distancesView(myRowIndex)); Kokkos::single(Kokkos::PerTeam(member), [=, *this]() { m_intraTeamSentinelView(myRowIndex) = intraTeamCheck; }); } }; template void test_A(std::size_t numTeams, std::size_t numCols, int apiId) { /* description: use a rank-2 view randomly filled with values, and run a team-level copy_if where only the values strictly greater than a threshold are copied into a new view */ const auto threshold = static_cast(151); // ----------------------------------------------- // prepare data // ----------------------------------------------- // create a view in the memory space associated with default exespace // with as many rows as the number of teams and fill it with random // values from an arbitrary range. auto [sourceView, sourceViewBeforeOp_h] = create_random_view_and_host_clone( LayoutTag{}, numTeams, numCols, Kokkos::pair{5, 523}, "sourceView"); // ----------------------------------------------- // launch kokkos kernel // ----------------------------------------------- using space_t = Kokkos::DefaultExecutionSpace; Kokkos::TeamPolicy policy(numTeams, Kokkos::AUTO()); // create the destination view Kokkos::View destView("destView", numTeams, numCols); // copy_if returns an iterator so to verify that it is correct // each team stores the distance of the returned iterator from the // beginning of the interval that team operates on and then we check // that these distances match the std result Kokkos::View distancesView("distancesView", numTeams); // sentinel to check if all members of the team compute the same result Kokkos::View intraTeamSentinelView("intraTeamSameResult", numTeams); // use CTAD for functor TestFunctorA fnc(sourceView, destView, distancesView, intraTeamSentinelView, threshold, apiId); Kokkos::parallel_for(policy, fnc); // ----------------------------------------------- // run cpp-std kernel and check // ----------------------------------------------- auto distancesView_h = create_host_space_copy(distancesView); auto intraTeamSentinelView_h = create_host_space_copy(intraTeamSentinelView); Kokkos::View stdDestView("stdDestView", numTeams, numCols); GreaterThanValueFunctor predicate(threshold); for (std::size_t i = 0; i < sourceView.extent(0); ++i) { auto rowFrom = Kokkos::subview(sourceViewBeforeOp_h, i, Kokkos::ALL()); auto rowDest = Kokkos::subview(stdDestView, i, Kokkos::ALL()); auto it = std::copy_if(KE::cbegin(rowFrom), KE::cend(rowFrom), KE::begin(rowDest), predicate); const std::size_t stdDistance = KE::distance(KE::begin(rowDest), it); ASSERT_EQ(stdDistance, distancesView_h(i)); ASSERT_TRUE(intraTeamSentinelView_h(i)); } auto dataViewAfterOp_h = create_host_space_copy(destView); expect_equal_host_views(stdDestView, dataViewAfterOp_h); } template void run_all_scenarios() { for (int numTeams : teamSizesToTest) { for (const auto& numCols : {0, 1, 2, 13, 101, 1444, 8153}) { for (int apiId : {0, 1}) { test_A(numTeams, numCols, apiId); } } } } TEST(std_algorithms_copy_if_team_test, test) { // FIXME_OPENMPTARGET #if defined(KOKKOS_ENABLE_OPENMPTARGET) && defined(KOKKOS_ARCH_INTEL_GPU) GTEST_SKIP() << "the test is known to fail with OpenMPTarget on Intel GPUs"; #endif run_all_scenarios(); run_all_scenarios(); run_all_scenarios(); } } // namespace TeamCopyIf } // namespace stdalgos } // namespace Test