| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173 |
- /* Copyright (C) 2013-2014 Povilas Kanapickas <[email protected]>
- Distributed under the Boost Software License, Version 1.0.
- (See accompanying file LICENSE_1_0.txt or copy at
- http://www.boost.org/LICENSE_1_0.txt)
- */
- #ifndef LIBSIMDPP_SIMDPP_CORE_CMP_EQ_H
- #define LIBSIMDPP_SIMDPP_CORE_CMP_EQ_H
- #ifndef LIBSIMDPP_SIMD_H
- #error "This file must be included through simd.h"
- #endif
- #include <simdpp/types.h>
- #include <simdpp/detail/insn/cmp_eq.h>
- #include <simdpp/core/detail/scalar_arg_impl.h>
- namespace simdpp {
- namespace SIMDPP_ARCH_NAMESPACE {
- /** Compares 8-bit values for equality.
- @code
- r0 = (a0 == b0) ? 0xff : 0x0
- ...
- rN = (aN == bN) ? 0xff : 0x0
- @endcode
- @par 256-bit version:
- @icost{SSE2-AVX, NEON, ALTIVEC, 2}
- */
- template<unsigned N, class V1, class V2> SIMDPP_INL
- mask_int8<N,expr_empty> cmp_eq(const any_int8<N,V1>& a,
- const any_int8<N,V2>& b)
- {
- typename detail::get_expr2_nosign<V1, V2>::type ra, rb;
- ra = a.wrapped().eval();
- rb = b.wrapped().eval();
- return detail::insn::i_cmp_eq(ra, rb);
- }
- SIMDPP_SCALAR_ARG_IMPL_VEC_EXPR(cmp_eq, mask_int8, any_int8)
- /** Compares 16-bit values for equality.
- @code
- r0 = (a0 == b0) ? 0xffff : 0x0
- ...
- rN = (aN == bN) ? 0xffff : 0x0
- @endcode
- @par 256-bit version:
- @icost{SSE2-AVX, NEON, ALTIVEC, 2}
- */
- template<unsigned N, class V1, class V2> SIMDPP_INL
- mask_int16<N,expr_empty> cmp_eq(const any_int16<N,V1>& a,
- const any_int16<N,V2>& b)
- {
- typename detail::get_expr2_nosign<V1, V2>::type ra, rb;
- ra = a.wrapped().eval();
- rb = b.wrapped().eval();
- return detail::insn::i_cmp_eq(ra, rb);
- }
- SIMDPP_SCALAR_ARG_IMPL_VEC_EXPR(cmp_eq, mask_int16, any_int16)
- /** Compares the values of two int32x4 vectors for equality
- @code
- r0 = (a0 == b0) ? 0xffffffff : 0x0
- ...
- rN = (aN == bN) ? 0xffffffff : 0x0
- @endcode
- @par 256-bit version:
- @icost{SSE2-AVX, NEON, ALTIVEC, 2}
- */
- template<unsigned N, class V1, class V2> SIMDPP_INL
- mask_int32<N,expr_empty> cmp_eq(const any_int32<N,V1>& a,
- const any_int32<N,V2>& b)
- {
- typename detail::get_expr2_nosign<V1, V2>::type ra, rb;
- ra = a.wrapped().eval();
- rb = b.wrapped().eval();
- return detail::insn::i_cmp_eq(ra, rb);
- }
- SIMDPP_SCALAR_ARG_IMPL_VEC_EXPR(cmp_eq, mask_int32, any_int32)
- /** Compares the values of two int64x2 vectors for equality
- @code
- r0 = (a0 == b0) ? 0xffffffffffffffff : 0x0
- ...
- rN = (aN == bN) ? 0xffffffffffffffff : 0x0
- @endcode
- @par 128-bit version:
- @icost{SSE2-SSSE3, 5}
- @icost{XOP, 1}
- @icost{NEON, 3}
- @icost{ALTIVEC, 3-4}
- @par 256-bit version:
- @icost{SSE2-SSSE3, AVX, 10}
- @icost{XOP, SSE4.1, 2}
- @icost{NEON, 6}
- @icost{ALTIVEC, 6-7}
- */
- template<unsigned N, class V1, class V2> SIMDPP_INL
- mask_int64<N,expr_empty> cmp_eq(const any_int64<N,V1>& a,
- const any_int64<N,V2>& b)
- {
- typename detail::get_expr2_nosign<V1, V2>::type ra, rb;
- ra = a.wrapped().eval();
- rb = b.wrapped().eval();
- return detail::insn::i_cmp_eq(ra, rb);
- }
- SIMDPP_SCALAR_ARG_IMPL_VEC_EXPR(cmp_eq, mask_int64, any_int64)
- /** Compares the values of two float32x4 vectors for equality
- @code
- r0 = (a0 == b0) ? 0xffffffff : 0x0
- ...
- rN = (aN == bN) ? 0xffffffff : 0x0
- @endcode
- @par 256-bit version:
- @icost{SSE2-SSE4.1, NEON, ALTIVEC, 2}
- */
- template<unsigned N, class V1, class V2> SIMDPP_INL
- mask_float32<N,expr_empty> cmp_eq(const any_float32<N,V1>& a,
- const any_float32<N,V2>& b)
- {
- return detail::insn::i_cmp_eq(a.wrapped().eval(), b.wrapped().eval());
- }
- SIMDPP_SCALAR_ARG_IMPL_VEC_EXPR(cmp_eq, mask_float32, any_float32)
- /** Compares the values of two float64x2 vectors for equality
- @code
- r0 = (a0 == b0) ? 0xffffffffffffffff : 0x0
- ...
- rN = (aN == bN) ? 0xffffffffffffffff : 0x0
- @endcode
- @par 128-bit version:
- @novec{NEON, ALTIVEC}
- @par 256-bit version:
- @novec{NEON, ALTIVEC}
- @icost{SSE2-SSE4.1, 2}
- */
- template<unsigned N, class V1, class V2> SIMDPP_INL
- mask_float64<N,expr_empty> cmp_eq(const any_float64<N,V1>& a,
- const any_float64<N,V2>& b)
- {
- return detail::insn::i_cmp_eq(a.wrapped().eval(), b.wrapped().eval());
- }
- SIMDPP_SCALAR_ARG_IMPL_VEC_EXPR(cmp_eq, mask_float64, any_float64)
- } // namespace SIMDPP_ARCH_NAMESPACE
- } // namespace simdpp
- #endif
|