// The Construct // // Copyright (C) The Construct Developers, Authors & Contributors // Copyright (C) 2016-2020 Jason Volk // // Permission to use, copy, modify, and/or distribute this software for any // purpose with or without fee is hereby granted, provided that the above // copyright notice and this permission notice is present in all copies. The // full license for this software is available in the LICENSE file. #pragma once #define HAVE_IRCD_SIMD_SHR_H // xmmx shift-right interface namespace ircd::simd { template T _shr(const T) noexcept; template typename std::enable_if::type shr(const T a) noexcept; template typename std::enable_if::type shr(const T a) noexcept; template typename std::enable_if::type shr(const T a) noexcept; } template [[using gnu: always_inline, gnu_inline, artificial]] extern inline T ircd::simd::_shr(const T a) noexcept { static_assert ( sizeof(T) == sizeof(V) ); static_assert ( b % 8 == 0, "[emulated] xmmx register only shifts right at bytewise resolution." ); constexpr int B { b / 8 }; V arg(a), ret(a); for(size_t i(0); i < sizeof(V) - B; ++i) ret[i] = arg[i + B]; for(size_t i(sizeof(V) - B); i < sizeof(V); ++i) ret[i] = 0; return T(ret); } #if defined(HAVE_X86INTRIN_H) && defined(__SSE2__) template [[using gnu: always_inline, gnu_inline, artificial]] extern inline typename std::enable_if::type ircd::simd::shr(const T a) noexcept { static_assert ( b % 8 == 0, "xmmx register only shifts right at bytewise resolution." ); return T(_mm_bsrli_si128(u128x1(a), b / 8)); } #else template [[using gnu: always_inline, gnu_inline, artificial]] extern inline typename std::enable_if::type ircd::simd::shr(const T a) noexcept { return _shr(a); } #endif #if defined(HAVE_X86INTRIN_H) && defined(__AVX2__) template [[using gnu: always_inline, gnu_inline, artificial]] extern inline typename std::enable_if::type ircd::simd::shr(const T a) noexcept { static_assert ( b % 8 == 0, "ymmx register only shifts right at bytewise resolution." ); return T(_mm256_srli_si256(u256x1(a), b / 8)); } #else template [[using gnu: always_inline, gnu_inline, artificial]] extern inline typename std::enable_if::type ircd::simd::shr(const T a) noexcept { return _shr(a); } #endif template [[using gnu: always_inline, gnu_inline, artificial]] extern inline typename std::enable_if::type ircd::simd::shr(const T a) noexcept { return _shr(a); }