0
0
Fork 0
mirror of https://github.com/matrix-construct/construct synced 2024-12-26 15:33:54 +01:00

ircd::simd: Use template as basis for unaligned wrapper; simplify suite.

ircd::simd: Rename unaligned header.
This commit is contained in:
Jason Volk 2020-10-06 17:42:06 -07:00
parent e69ad0b49a
commit 112151249b
3 changed files with 94 additions and 112 deletions

View file

@ -12,7 +12,7 @@
#define HAVE_IRCD_SIMD_H
#include "type.h"
#include "type.unaligned.h"
#include "unaligned.h"
#include "traits.h"
#include "lane_cast.h"
#include "broad_cast.h"

View file

@ -1,111 +0,0 @@
// The Construct
//
// Copyright (C) The Construct Developers, Authors & Contributors
// Copyright (C) 2016-2020 Jason Volk <jason@zemos.net>
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice is present in all copies. The
// full license for this software is available in the LICENSE file.
#pragma once
#define HAVE_IRCD_SIMD_TYPE_UNALIGNED_H
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wpsabi"
#pragma GCC diagnostic ignored "-Wpacked"
/// Unaligned type wrapper macro
#define IRCD_SIMD_TYPEDEF_UNALIGNED(TYPE, NAME) \
struct \
__attribute__((packed)) \
__attribute__((aligned(1))) \
__attribute__((visibility("internal"))) \
NAME \
{ \
using value_type = TYPE; \
\
TYPE val; \
\
operator TYPE() const { return val; } \
\
template<class T> NAME &operator=(T&& t) \
{ \
val = std::forward<T>(t); \
return *this; \
} \
}
//
// unsigned
//
namespace ircd::simd
{
IRCD_SIMD_TYPEDEF_UNALIGNED(m512i, u512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256i, u256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128i, u128x1_u);
}
namespace ircd
{
using simd::u512x1_u;
using simd::u256x1_u;
using simd::u128x1_u;
}
//
// signed
//
namespace ircd::simd
{
IRCD_SIMD_TYPEDEF_UNALIGNED(m512i, i512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256i, i256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128i, i128x1_u);
}
namespace ircd
{
using simd::i512x1_u;
using simd::i256x1_u;
using simd::i128x1_u;
}
//
// single precision
//
namespace ircd::simd
{
IRCD_SIMD_TYPEDEF_UNALIGNED(m512f, f512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256f, f256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128f, f128x1_u);
}
namespace ircd
{
using simd::f512x1_u;
using simd::f256x1_u;
using simd::f128x1_u;
}
//
// double precision
//
namespace ircd::simd
{
IRCD_SIMD_TYPEDEF_UNALIGNED(m512d, d512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256d, d256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128d, d128x1_u);
}
namespace ircd
{
using simd::d512x1_u;
using simd::d256x1_u;
using simd::d128x1_u;
}
#pragma GCC diagnostic pop

View file

@ -0,0 +1,93 @@
// The Construct
//
// Copyright (C) The Construct Developers, Authors & Contributors
// Copyright (C) 2016-2020 Jason Volk <jason@zemos.net>
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice is present in all copies. The
// full license for this software is available in the LICENSE file.
#pragma once
#define HAVE_IRCD_SIMD_TYPE_UNALIGNED_H
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wpsabi"
#pragma GCC diagnostic ignored "-Wpacked"
namespace ircd::simd
{
template<class T> struct unaligned;
}
/// Unaligned wrapper template class.
/// T = inner aligned type
template<class T>
struct
__attribute__((packed))
__attribute__((aligned(1)))
__attribute__((visibility("internal")))
ircd::simd::unaligned
{
using value_type = T;
T val;
operator T() const
{
return val;
}
template<class U>
unaligned(U&& val)
:val(std::forward<U>(val))
{}
};
/// Unaligned type wrapper macro. We use this macro to define several common
/// instantiations of unaligned<T>.
///
#define IRCD_SIMD_TYPEDEF_UNALIGNED(TYPE, NAME) \
namespace ircd \
{ \
namespace simd \
{ \
using NAME = unaligned<TYPE>; \
} \
\
using simd::NAME; \
}
//
// unsigned
//
IRCD_SIMD_TYPEDEF_UNALIGNED(m512i, u512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256i, u256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128i, u128x1_u);
//
// signed
//
IRCD_SIMD_TYPEDEF_UNALIGNED(m512i, i512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256i, i256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128i, i128x1_u);
//
// single precision
//
IRCD_SIMD_TYPEDEF_UNALIGNED(m512f, f512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256f, f256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128f, f128x1_u);
//
// double precision
//
IRCD_SIMD_TYPEDEF_UNALIGNED(m512d, d512x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m256d, d256x1_u);
IRCD_SIMD_TYPEDEF_UNALIGNED(m128d, d128x1_u);
#pragma GCC diagnostic pop