123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590 |
- // Do not include this header directly.
- // Control flow functionality in common between all the headers.
- //
- // Copyright 2020-2021 Binomial LLC
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // http://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
#ifdef _DEBUG
// Debug-only invariant check: asserts that andnot(m_kernel_exec, m_exec) has no lane set,
// i.e. m_exec never enables a lane that the kernel-wide mask has disabled.
CPPSPMD_FORCE_INLINE void spmd_kernel::check_masks()
{
    const exec_mask stray_lanes = andnot(m_kernel_exec, m_exec);
    assert(!any(stray_lanes));
}
#endif
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_break()
- {
- #ifdef _DEBUG
- assert(m_in_loop);
- #endif
- m_exec = exec_mask::all_off();
- }
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_continue()
- {
- #ifdef _DEBUG
- assert(m_in_loop);
- #endif
- // Kill any active lanes, and remember which lanes were active so we can re-enable them at the end of the loop body.
- m_continue_mask = m_continue_mask | m_exec;
- m_exec = exec_mask::all_off();
- }
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_return()
- {
- // Permenantly kill all active lanes
- m_kernel_exec = andnot(m_exec, m_kernel_exec);
- m_exec = exec_mask::all_off();
- }
-
- template<typename UnmaskedBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_unmasked(const UnmaskedBody& unmaskedBody)
- {
- exec_mask orig_exec = m_exec, orig_kernel_exec = m_kernel_exec;
- m_kernel_exec = exec_mask::all_on();
- m_exec = exec_mask::all_on();
- unmaskedBody();
- m_kernel_exec = m_kernel_exec & orig_kernel_exec;
- m_exec = m_exec & orig_exec;
-
- check_masks();
- }
- struct scoped_unmasked_restorer
- {
- spmd_kernel *m_pKernel;
- exec_mask m_orig_exec, m_orig_kernel_exec;
-
- CPPSPMD_FORCE_INLINE scoped_unmasked_restorer(spmd_kernel *pKernel) :
- m_pKernel(pKernel),
- m_orig_exec(pKernel->m_exec),
- m_orig_kernel_exec(pKernel->m_kernel_exec)
- {
- pKernel->m_kernel_exec = exec_mask::all_on();
- pKernel->m_exec = exec_mask::all_on();
- }
- CPPSPMD_FORCE_INLINE ~scoped_unmasked_restorer()
- {
- m_pKernel->m_kernel_exec = m_pKernel->m_kernel_exec & m_orig_kernel_exec;
- m_pKernel->m_exec = m_pKernel->m_exec & m_orig_exec;
- m_pKernel->check_masks();
- }
- };
- #define SPMD_UNMASKED_BEGIN { scoped_unmasked_restorer _unmasked_restorer(this);
- #define SPMD_UNMASKED_END }
- #if 0
- template<typename SPMDKernel, typename... Args>
- CPPSPMD_FORCE_INLINE decltype(auto) spmd_kernel::spmd_call(Args&&... args)
- {
- SPMDKernel kernel;
- kernel.init(m_exec);
- return kernel._call(std::forward<Args>(args)...);
- }
- #else
- template<typename SPMDKernel, typename... Args>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_call(Args&&... args)
- {
- SPMDKernel kernel;
- kernel.init(m_exec);
- kernel._call(std::forward<Args>(args)...);
- }
- #endif
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_if_break(const vbool& cond)
- {
- #ifdef _DEBUG
- assert(m_in_loop);
- #endif
-
- exec_mask cond_exec(cond);
-
- m_exec = andnot(m_exec & cond_exec, m_exec);
- check_masks();
- }
- // No SPMD breaks, continues, etc. allowed
- template<typename IfBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_sif(const vbool& cond, const IfBody& ifBody)
- {
- exec_mask im = m_exec & exec_mask(cond);
- if (any(im))
- {
- const exec_mask orig_exec = m_exec;
- m_exec = im;
- ifBody();
- m_exec = orig_exec;
- }
- }
- // No SPMD breaks, continues, etc. allowed
- template<typename IfBody, typename ElseBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_sifelse(const vbool& cond, const IfBody& ifBody, const ElseBody &elseBody)
- {
- const exec_mask orig_exec = m_exec;
- exec_mask im = m_exec & exec_mask(cond);
- if (any(im))
- {
- m_exec = im;
- ifBody();
- }
- exec_mask em = orig_exec & exec_mask(!cond);
- if (any(em))
- {
- m_exec = em;
- elseBody();
- }
-
- m_exec = orig_exec;
- }
- template<typename IfBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_if(const vbool& cond, const IfBody& ifBody)
- {
- exec_mask cond_exec(cond);
-
- exec_mask pre_if_exec = cond_exec & m_exec;
- if (any(pre_if_exec))
- {
- exec_mask unexecuted_lanes = andnot(cond_exec, m_exec);
- m_exec = pre_if_exec;
- ifBody();
- // Propagate any lanes that got disabled inside the if body into the exec mask outside the if body, but turn on any lanes that didn't execute inside the if body.
- m_exec = m_exec | unexecuted_lanes;
- check_masks();
- }
- }
- template<typename IfBody, typename ElseBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_ifelse(const vbool& cond, const IfBody& ifBody, const ElseBody& elseBody)
- {
- bool all_flag = false;
- exec_mask cond_exec(cond);
-
- {
- exec_mask pre_if_exec = cond_exec & m_exec;
- int mask = pre_if_exec.get_movemask();
- if (mask != 0)
- {
- all_flag = ((uint32_t)mask == m_exec.get_movemask());
- exec_mask unexecuted_lanes = andnot(cond_exec, m_exec);
- m_exec = pre_if_exec;
- ifBody();
- // Propagate any lanes that got disabled inside the if body into the exec mask outside the if body, but turn on any lanes that didn't execute inside the if body.
- m_exec = m_exec | unexecuted_lanes;
- check_masks();
- }
- }
- if (!all_flag)
- {
- exec_mask pre_if_exec = andnot(cond_exec, m_exec);
- if (any(pre_if_exec))
- {
- exec_mask unexecuted_lanes = cond_exec & m_exec;
- m_exec = pre_if_exec;
- ifBody();
- // Propagate any lanes that got disabled inside the if body into the exec mask outside the if body, but turn on any lanes that didn't execute inside the if body.
- m_exec = m_exec | unexecuted_lanes;
- check_masks();
- }
- }
- }
- struct scoped_exec_restorer
- {
- exec_mask *m_pMask;
- exec_mask m_prev_mask;
- CPPSPMD_FORCE_INLINE scoped_exec_restorer(exec_mask *pExec_mask) : m_pMask(pExec_mask), m_prev_mask(*pExec_mask) { }
- CPPSPMD_FORCE_INLINE ~scoped_exec_restorer() { *m_pMask = m_prev_mask; }
- };
// Macro form of the "simple" if/else. Each branch computes its lane mask from the current m_exec,
// is entered only when at least one lane qualifies, and restores m_exec through a
// scoped_exec_restorer when its brace scope closes.
// Cannot use SPMD break, continue, or return inside "simple" if/else
#define SPMD_SIF(cond) \
    exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(m_exec & exec_mask(vbool(cond))); \
    if (any(CPPSPMD_GLUER2(_exec_temp, __LINE__))) \
    { \
        CPPSPMD::scoped_exec_restorer CPPSPMD_GLUER2(_exec_restore_, __LINE__)(&m_exec); \
        m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__);

#define SPMD_SELSE(cond) \
    } \
    exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(m_exec & exec_mask(!vbool(cond))); \
    if (any(CPPSPMD_GLUER2(_exec_temp, __LINE__))) \
    { \
        CPPSPMD::scoped_exec_restorer CPPSPMD_GLUER2(_exec_restore_, __LINE__)(&m_exec); \
        m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__);

#define SPMD_SENDIF }
// Same as SPMD_SIF, except doesn't use a scoped object: the entry mask is kept in a block-local
// _orig_exec and written back explicitly by SPMD_SELSE2 / SPMD_SEND_IF2.
#define SPMD_SIF2(cond) \
    exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(m_exec & exec_mask(vbool(cond))); \
    if (any(CPPSPMD_GLUER2(_exec_temp, __LINE__))) \
    { \
        exec_mask _orig_exec = m_exec; \
        m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__);

#define SPMD_SELSE2(cond) \
        m_exec = _orig_exec; \
    } \
    exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(m_exec & exec_mask(!vbool(cond))); \
    if (any(CPPSPMD_GLUER2(_exec_temp, __LINE__))) \
    { \
        exec_mask _orig_exec = m_exec; \
        m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__);

#define SPMD_SEND_IF2 \
        m_exec = _orig_exec; \
    }
// Same as SPMD_SIF(), except the if/else blocks are always executed (there is no any() test, so a
// block runs even when its lane mask is empty).
#define SPMD_SAIF(cond) \
    exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(m_exec & exec_mask(vbool(cond))); \
    { \
        CPPSPMD::scoped_exec_restorer CPPSPMD_GLUER2(_exec_restore_, __LINE__)(&m_exec); \
        m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__);

#define SPMD_SAELSE(cond) \
    } \
    exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(m_exec & exec_mask(!vbool(cond))); \
    { \
        CPPSPMD::scoped_exec_restorer CPPSPMD_GLUER2(_exec_restore_, __LINE__)(&m_exec); \
        m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__);

#define SPMD_SAENDIF }
// Masked "select" (switch-like) construct. SPMD_SSELECT opens a do { ... } while(0) scope that
// snapshots m_exec in a scoped_exec_restorer and tracks, in _select_executed, which lanes have been
// handled by a case so far. A case is entered only when some entry lane equals its value;
// SPMD_SCASE_END leaves the whole select early once every entry lane has been handled.
// SPMD_SDEFAULT runs on the entry lanes no case has handled.
// Cannot use SPMD break, continue, or return inside sselect
#define SPMD_SSELECT(var) \
    do \
    { \
        vint_t _select_var = var; \
        scoped_exec_restorer _orig_exec(&m_exec); \
        exec_mask _select_executed(exec_mask::all_off());

#define SPMD_SCASE(value) \
        exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(_orig_exec.m_prev_mask & exec_mask(vbool(_select_var == (value)))); \
        if (any(CPPSPMD_GLUER2(_exec_temp, __LINE__))) \
        { \
            m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__); \
            _select_executed = _select_executed | m_exec;

//#define SPMD_SCASE_END if (_select_executed.get_movemask() == _orig_exec.m_prev_mask.get_movemask()) break; }
#define SPMD_SCASE_END \
            if (!any(_select_executed ^ _orig_exec.m_prev_mask)) break; \
        }

#define SPMD_SDEFAULT \
        exec_mask _all_other_lanes(andnot(_select_executed, _orig_exec.m_prev_mask)); \
        if (any(_all_other_lanes)) \
        { \
            m_exec = _all_other_lanes;

#define SPMD_SDEFAULT_END }

#define SPMD_SSELECT_END \
    } while(0);
// Same as SPMD_SSELECT, except all cases are executed (no any() test and no early exit, so a case
// or the default runs even when its lane mask is empty).
// Cannot use SPMD break, continue, or return inside sselect
#define SPMD_SASELECT(var) \
    do \
    { \
        vint_t _select_var = var; \
        scoped_exec_restorer _orig_exec(&m_exec); \
        exec_mask _select_executed(exec_mask::all_off());

#define SPMD_SACASE(value) \
        exec_mask CPPSPMD_GLUER2(_exec_temp, __LINE__)(_orig_exec.m_prev_mask & exec_mask(vbool(_select_var == (value)))); \
        { \
            m_exec = CPPSPMD_GLUER2(_exec_temp, __LINE__); \
            _select_executed = _select_executed | m_exec;

#define SPMD_SACASE_END }

#define SPMD_SADEFAULT \
        exec_mask _all_other_lanes(andnot(_select_executed, _orig_exec.m_prev_mask)); \
        { \
            m_exec = _all_other_lanes;

#define SPMD_SADEFAULT_END }

#define SPMD_SASELECT_END \
    } while(0);
- struct scoped_exec_restorer2
- {
- spmd_kernel *m_pKernel;
- exec_mask m_unexecuted_lanes;
-
- CPPSPMD_FORCE_INLINE scoped_exec_restorer2(spmd_kernel *pKernel, const vbool &cond) :
- m_pKernel(pKernel)
- {
- exec_mask cond_exec(cond);
- m_unexecuted_lanes = andnot(cond_exec, pKernel->m_exec);
- pKernel->m_exec = cond_exec & pKernel->m_exec;
- }
- CPPSPMD_FORCE_INLINE ~scoped_exec_restorer2()
- {
- m_pKernel->m_exec = m_pKernel->m_exec | m_unexecuted_lanes;
- m_pKernel->check_masks();
- }
- };
// Macro form of the masked if/else. Each branch lives in its own brace scope guarded by a
// scoped_exec_restorer2 and is entered only when at least one lane is active after narrowing.
// Uses `this`, so the macros must be used inside a kernel member function.
#define SPMD_IF(cond) \
    { \
        CPPSPMD::scoped_exec_restorer2 CPPSPMD_GLUER2(_exec_restore2_, __LINE__)(this, vbool(cond)); \
        if (any(m_exec)) \
        {

#define SPMD_ELSE(cond) \
        } \
    } \
    { \
        CPPSPMD::scoped_exec_restorer2 CPPSPMD_GLUER2(_exec_restore2_, __LINE__)(this, !vbool(cond)); \
        if (any(m_exec)) \
        {

#define SPMD_END_IF \
        } \
    }

// Same as SPMD_IF, except the conditional block is always executed.
#define SPMD_AIF(cond) \
    { \
        CPPSPMD::scoped_exec_restorer2 CPPSPMD_GLUER2(_exec_restore2_, __LINE__)(this, vbool(cond)); \
        {

#define SPMD_AELSE(cond) \
        } \
    } \
    { \
        CPPSPMD::scoped_exec_restorer2 CPPSPMD_GLUER2(_exec_restore2_, __LINE__)(this, !vbool(cond)); \
        {

#define SPMD_AEND_IF \
        } \
    }
- class scoped_exec_saver
- {
- exec_mask m_exec, m_kernel_exec, m_continue_mask;
- spmd_kernel *m_pKernel;
- #ifdef _DEBUG
- bool m_in_loop;
- #endif
- public:
- inline scoped_exec_saver(spmd_kernel *pKernel) :
- m_exec(pKernel->m_exec), m_kernel_exec(pKernel->m_kernel_exec), m_continue_mask(pKernel->m_continue_mask),
- m_pKernel(pKernel)
- {
- #ifdef _DEBUG
- m_in_loop = pKernel->m_in_loop;
- #endif
- }
-
- inline ~scoped_exec_saver()
- {
- m_pKernel->m_exec = m_exec;
- m_pKernel->m_continue_mask = m_continue_mask;
- m_pKernel->m_kernel_exec = m_kernel_exec;
- #ifdef _DEBUG
- m_pKernel->m_in_loop = m_in_loop;
- m_pKernel->check_masks();
- #endif
- }
- };
// Declares a scoped_exec_saver for the enclosing scope and clears m_continue_mask.
#define SPMD_BEGIN_CALL \
    scoped_exec_saver CPPSPMD_GLUER2(_begin_call_scoped_exec_saver, __LINE__)(this); \
    m_continue_mask = exec_mask::all_off();

// Same as SPMD_BEGIN_CALL, but additionally forces m_exec to all-on.
#define SPMD_BEGIN_CALL_ALL_LANES \
    scoped_exec_saver CPPSPMD_GLUER2(_begin_call_scoped_exec_saver, __LINE__)(this); \
    m_exec = exec_mask::all_on(); \
    m_continue_mask = exec_mask::all_off();
- template<typename ForeachBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_foreach(int begin, int end, const ForeachBody& foreachBody)
- {
- if (begin == end)
- return;
-
- if (!any(m_exec))
- return;
- // We don't support iterating backwards.
- if (begin > end)
- std::swap(begin, end);
- exec_mask prev_continue_mask = m_continue_mask, prev_exec = m_exec;
-
- int total_full = (end - begin) / PROGRAM_COUNT;
- int total_partial = (end - begin) % PROGRAM_COUNT;
- lint_t loop_index = begin + program_index;
-
- const int total_loops = total_full + (total_partial ? 1 : 0);
- m_continue_mask = exec_mask::all_off();
- for (int i = 0; i < total_loops; i++)
- {
- int n = PROGRAM_COUNT;
- if ((i == (total_loops - 1)) && (total_partial))
- {
- exec_mask partial_mask = exec_mask(vint_t(total_partial) > vint_t(program_index));
- m_exec = m_exec & partial_mask;
- n = total_partial;
- }
- foreachBody(loop_index, n);
- m_exec = m_exec | m_continue_mask;
- if (!any(m_exec))
- break;
- m_continue_mask = exec_mask::all_off();
- check_masks();
-
- store_all(loop_index, loop_index + PROGRAM_COUNT);
- }
- m_exec = prev_exec & m_kernel_exec;
- m_continue_mask = prev_continue_mask;
- check_masks();
- }
- template<typename WhileCondBody, typename WhileBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_while(const WhileCondBody& whileCondBody, const WhileBody& whileBody)
- {
- exec_mask orig_exec = m_exec;
- exec_mask orig_continue_mask = m_continue_mask;
- m_continue_mask = exec_mask::all_off();
- #ifdef _DEBUG
- const bool prev_in_loop = m_in_loop;
- m_in_loop = true;
- #endif
- while(true)
- {
- exec_mask cond_exec = exec_mask(whileCondBody());
- m_exec = m_exec & cond_exec;
- if (!any(m_exec))
- break;
- whileBody();
- m_exec = m_exec | m_continue_mask;
- m_continue_mask = exec_mask::all_off();
- check_masks();
- }
- #ifdef _DEBUG
- m_in_loop = prev_in_loop;
- #endif
- m_exec = orig_exec & m_kernel_exec;
- m_continue_mask = orig_continue_mask;
- check_masks();
- }
- struct scoped_while_restorer
- {
- spmd_kernel *m_pKernel;
- exec_mask m_orig_exec, m_orig_continue_mask;
- #ifdef _DEBUG
- bool m_prev_in_loop;
- #endif
-
- CPPSPMD_FORCE_INLINE scoped_while_restorer(spmd_kernel *pKernel) :
- m_pKernel(pKernel),
- m_orig_exec(pKernel->m_exec),
- m_orig_continue_mask(pKernel->m_continue_mask)
- {
- pKernel->m_continue_mask.all_off();
- #ifdef _DEBUG
- m_prev_in_loop = pKernel->m_in_loop;
- pKernel->m_in_loop = true;
- #endif
- }
- CPPSPMD_FORCE_INLINE ~scoped_while_restorer()
- {
- m_pKernel->m_exec = m_orig_exec & m_pKernel->m_kernel_exec;
- m_pKernel->m_continue_mask = m_orig_continue_mask;
- #ifdef _DEBUG
- m_pKernel->m_in_loop = m_prev_in_loop;
- m_pKernel->check_masks();
- #endif
- }
- };
#undef SPMD_WHILE
#undef SPMD_WEND

// Macro form of the masked while loop. SPMD_WHILE opens a scope guarded by a scoped_while_restorer
// and a while(true) that narrows m_exec by cond on every iteration, leaving once no lane is active.
// SPMD_WEND re-enables the lanes recorded in m_continue_mask, clears that mask and closes both scopes.
#define SPMD_WHILE(cond) \
    { \
        scoped_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
        while(true) \
        { \
            exec_mask CPPSPMD_GLUER2(cond_exec, __LINE__) = exec_mask(vbool(cond)); \
            m_exec = m_exec & CPPSPMD_GLUER2(cond_exec, __LINE__); \
            if (!any(m_exec)) break;

#define SPMD_WEND \
            m_exec = m_exec | m_continue_mask; \
            m_continue_mask = exec_mask::all_off(); \
            check_masks(); \
        } \
    }
// Macro form of the masked foreach over the range between bi and ei (the bounds are swapped if
// bi > ei). loop_var is declared by the macro and holds the per-lane indices of the current step;
// on a final partial step the lanes beyond the remainder are masked off.
// Nesting is not supported (although it will compile, but the results won't make much sense).
#define SPMD_FOREACH(loop_var, bi, ei) \
    if (((bi) != (ei)) && (any(m_exec))) \
    { \
        scoped_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
        uint32_t b = (uint32_t)(bi), e = (uint32_t)(ei); \
        if ((b) > (e)) { std::swap(b, e); } \
        const uint32_t total_full = ((e) - (b)) >> PROGRAM_COUNT_SHIFT, total_partial = ((e) - (b)) & (PROGRAM_COUNT - 1); \
        lint_t loop_var = program_index + (int)b; \
        const uint32_t total_loops = total_full + (total_partial ? 1U : 0U); \
        for (uint32_t CPPSPMD_GLUER2(_foreach_counter, __LINE__) = 0; CPPSPMD_GLUER2(_foreach_counter, __LINE__) < total_loops; ++CPPSPMD_GLUER2(_foreach_counter, __LINE__)) \
        { \
            if ((CPPSPMD_GLUER2(_foreach_counter, __LINE__) == (total_loops - 1)) && (total_partial)) \
            { \
                exec_mask partial_mask = exec_mask(vint_t((int)total_partial) > vint_t(program_index)); \
                m_exec = m_exec & partial_mask; \
            }

// Closes SPMD_FOREACH: re-enables the lanes recorded in m_continue_mask, leaves the loop when no lane
// is active, otherwise clears the continue mask and advances loop_var by PROGRAM_COUNT.
#define SPMD_FOREACH_END(loop_var) \
            m_exec = m_exec | m_continue_mask; \
            if (!any(m_exec)) break; \
            m_continue_mask = exec_mask::all_off(); \
            check_masks(); \
            store_all(loop_var, loop_var + PROGRAM_COUNT); \
        } \
    }
// Visits, one at a time, every lane that is set in m_exec's movemask on entry. index_var is declared
// by the macro as an int64_t (in the enclosing scope) and receives the lane number; inside the body
// m_exec is the result of enable_lane() for that lane, ANDed with m_kernel_exec. The whole construct
// is guarded by a scoped_while_restorer and is skipped when the movemask is zero.
// Okay to use spmd_continue or spmd_return, but not spmd_break
//
// Fix: the last line of SPMD_FOREACH_ACTIVE used to end in a line-continuation backslash, which
// spliced the following "#define SPMD_FOREACH_ACTIVE_END" line into this macro's replacement list
// (ill-formed, and SPMD_FOREACH_ACTIVE_END was never defined). The stray continuation is removed.
#define SPMD_FOREACH_ACTIVE(index_var) \
    int64_t index_var; \
    { \
        uint64_t _movemask = m_exec.get_movemask(); \
        if (_movemask) \
        { \
            scoped_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
            for (uint32_t _i = 0; _i < PROGRAM_COUNT; ++_i) \
            { \
                if (_movemask & (1U << _i)) \
                { \
                    m_exec.enable_lane(_i); \
                    m_exec = m_exec & m_kernel_exec; \
                    (index_var) = _i;

#define SPMD_FOREACH_ACTIVE_END \
                } \
            } \
        } \
    }
// Iterates over the distinct values held by the lanes of var: the lanes are stored to a scratch
// array, sorted and de-duplicated, and the body runs once per distinct value with index_var set to
// that value and m_exec set to the lanes of var equal to it.
// Okay to use spmd_continue, but not spmd_break.
// NOTE(review): the original comment read "but not spmd_break/spmd_continue", which contradicts
// itself; presumably spmd_return was meant - confirm.
#define SPMD_FOREACH_UNIQUE_INT(index_var, var) \
    { \
        scoped_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
        CPPSPMD_DECL(int_t, _vals[PROGRAM_COUNT]); \
        store_linear_all(_vals, var); \
        std::sort(_vals, _vals + PROGRAM_COUNT); \
        const int _n = (int)(std::unique(_vals, _vals + PROGRAM_COUNT) - _vals); \
        for (int _i = 0; _i < _n; ++_i) \
        { \
            int index_var = _vals[_i]; \
            vbool cond = (vint_t(var) == vint_t(index_var)); \
            m_exec = exec_mask(cond);

#define SPMD_FOREACH_UNIQUE_INT_END \
        } \
    }
- struct scoped_simple_while_restorer
- {
- spmd_kernel* m_pKernel;
- exec_mask m_orig_exec;
- #ifdef _DEBUG
- bool m_prev_in_loop;
- #endif
- CPPSPMD_FORCE_INLINE scoped_simple_while_restorer(spmd_kernel* pKernel) :
- m_pKernel(pKernel),
- m_orig_exec(pKernel->m_exec)
- {
-
- #ifdef _DEBUG
- m_prev_in_loop = pKernel->m_in_loop;
- pKernel->m_in_loop = true;
- #endif
- }
- CPPSPMD_FORCE_INLINE ~scoped_simple_while_restorer()
- {
- m_pKernel->m_exec = m_orig_exec;
- #ifdef _DEBUG
- m_pKernel->m_in_loop = m_prev_in_loop;
- m_pKernel->check_masks();
- #endif
- }
- };
// "Simple" masked while: narrows m_exec by cond at the top of every iteration and leaves once no
// lane is active; m_exec is restored by a scoped_simple_while_restorer when the scope closes.
// Cannot use SPMD break, continue, or return inside simple while
#define SPMD_SWHILE(cond) \
    { \
        scoped_simple_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
        while(true) \
        { \
            exec_mask CPPSPMD_GLUER2(cond_exec, __LINE__) = exec_mask(vbool(cond)); \
            m_exec = m_exec & CPPSPMD_GLUER2(cond_exec, __LINE__); \
            if (!any(m_exec)) break;

#define SPMD_SWEND \
        } \
    }

// "Simple" masked do/while: same as above, but the condition is tested at the bottom of the body.
// Cannot use SPMD break, continue, or return inside simple do
#define SPMD_SDO \
    { \
        scoped_simple_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
        while(true) \
        {

#define SPMD_SEND_DO(cond) \
            exec_mask CPPSPMD_GLUER2(cond_exec, __LINE__) = exec_mask(vbool(cond)); \
            m_exec = m_exec & CPPSPMD_GLUER2(cond_exec, __LINE__); \
            if (!any(m_exec)) break; \
        } \
    }
#undef SPMD_FOR
#undef SPMD_END_FOR

// Macro form of the masked for loop. for_init runs once, before the scoped_while_restorer is created;
// for_cond narrows m_exec at the top of every iteration and the loop ends once no lane is active.
// SPMD_END_FOR re-enables the lanes recorded in m_continue_mask, clears that mask, then runs for_inc.
#define SPMD_FOR(for_init, for_cond) \
    { \
        for_init; \
        scoped_while_restorer CPPSPMD_GLUER2(_while_restore_, __LINE__)(this); \
        while(true) \
        { \
            exec_mask CPPSPMD_GLUER2(cond_exec, __LINE__) = exec_mask(vbool(for_cond)); \
            m_exec = m_exec & CPPSPMD_GLUER2(cond_exec, __LINE__); \
            if (!any(m_exec)) break;

#define SPMD_END_FOR(for_inc) \
            m_exec = m_exec | m_continue_mask; \
            m_continue_mask = exec_mask::all_off(); \
            check_masks(); \
            for_inc; \
        } \
    }
-
- template<typename ForInitBody, typename ForCondBody, typename ForIncrBody, typename ForBody>
- CPPSPMD_FORCE_INLINE void spmd_kernel::spmd_for(const ForInitBody& forInitBody, const ForCondBody& forCondBody, const ForIncrBody& forIncrBody, const ForBody& forBody)
- {
- exec_mask orig_exec = m_exec;
- forInitBody();
- exec_mask orig_continue_mask = m_continue_mask;
- m_continue_mask = exec_mask::all_off();
- #ifdef _DEBUG
- const bool prev_in_loop = m_in_loop;
- m_in_loop = true;
- #endif
- while(true)
- {
- exec_mask cond_exec = exec_mask(forCondBody());
- m_exec = m_exec & cond_exec;
- if (!any(m_exec))
- break;
- forBody();
- m_exec = m_exec | m_continue_mask;
- m_continue_mask = exec_mask::all_off();
- check_masks();
-
- forIncrBody();
- }
- m_exec = orig_exec & m_kernel_exec;
- m_continue_mask = orig_continue_mask;
- #ifdef _DEBUG
- m_in_loop = prev_in_loop;
- check_masks();
- #endif
- }
|