// Copyright 2009-2020 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
#pragma once
|
|
|
|
#include "../sys/platform.h"
|
|
|
|
namespace embree
|
|
{
|
|
/* Varying numeric types */
|
|
/*! Generic varying float with N lanes held in a plain array. The anonymous
 *  union lets the same storage be addressed either as float lanes (f) or
 *  as int lanes (i). */
template<int N>
struct vfloat
{
  union { float f[N]; int i[N]; };

  /*! Read-only reference to float lane `index`. The index is only
   *  range-checked through assert. */
  __forceinline const float& operator [](size_t index) const { assert(index < N); return f[index]; }

  /*! Writable reference to float lane `index`. The index is only
   *  range-checked through assert. */
  __forceinline float& operator [](size_t index) { assert(index < N); return f[index]; }
};
|
|
|
|
/*! Generic varying double with N lanes held in a plain array. The anonymous
 *  union lets the same storage be addressed either as double lanes (f) or
 *  as long long lanes (i). */
template<int N>
struct vdouble
{
  union { double f[N]; long long i[N]; };

  /*! Read-only reference to double lane `index`. The index is only
   *  range-checked through assert. */
  __forceinline const double& operator [](size_t index) const { assert(index < N); return f[index]; }

  /*! Writable reference to double lane `index`. The index is only
   *  range-checked through assert. */
  __forceinline double& operator [](size_t index) { assert(index < N); return f[index]; }
};
|
|
|
|
/*! Generic varying signed integer with N lanes held in the array i. */
template<int N>
struct vint
{
  int i[N];

  /*! Read-only reference to lane `index`. The index is only range-checked
   *  through assert. */
  __forceinline const int& operator [](size_t index) const { assert(index < N); return i[index]; }

  /*! Writable reference to lane `index`. The index is only range-checked
   *  through assert. */
  __forceinline int& operator [](size_t index) { assert(index < N); return i[index]; }
};
|
|
|
|
/*! Generic varying unsigned integer with N lanes held in the array i. */
template<int N>
struct vuint
{
  unsigned int i[N];

  /*! Read-only reference to lane `index`. The index is only range-checked
   *  through assert. */
  __forceinline const unsigned int& operator [](size_t index) const { assert(index < N); return i[index]; }

  /*! Writable reference to lane `index`. The index is only range-checked
   *  through assert. */
  __forceinline unsigned int& operator [](size_t index) { assert(index < N); return i[index]; }
};
|
|
|
|
/*! Generic varying long long with N lanes held in the array i. */
template<int N>
struct vllong
{
  long long i[N];

  /*! Read-only reference to lane `index`. The index is only range-checked
   *  through assert. */
  __forceinline const long long& operator [](size_t index) const { assert(index < N); return i[index]; }

  /*! Writable reference to lane `index`. The index is only range-checked
   *  through assert. */
  __forceinline long long& operator [](size_t index) { assert(index < N); return i[index]; }
};
|
|
|
|
/* Varying bool types */

/*! N-lane bool for float/int: one int per lane. */
template<int N>
struct vboolf
{
  int i[N];
};

/*! N-lane bool for double/long long: one long long per lane. */
template<int N>
struct vboold
{
  long long i[N];
};
|
|
|
|
/* Aliases to default types */
|
|
template<int N> using vreal = vfloat<N>;
|
|
template<int N> using vbool = vboolf<N>;
|
|
|
|
/* Varying size constants: VSIZEX is the default size and VSIZEL the large
   size, selected at preprocessing time from the instruction-set macros the
   compiler defines. The checks run from most to least capable, so the
   first matching branch wins. */
#if defined(__AVX512VL__) // SKX
const int VSIZEX = 8;  // default size
const int VSIZEL = 16; // large size
#elif defined(__AVX512F__) // KNL
const int VSIZEX = 16;
const int VSIZEL = 16;
#elif defined(__AVX__)
const int VSIZEX = 8;
const int VSIZEL = 8;
#else
const int VSIZEX = 4;
const int VSIZEL = 4;
#endif
|
|
|
|
/* Extends varying size N to optimal or up to max(N, N2) */
|
|
template<int N, int N2 = VSIZEX>
|
|
struct vextend
|
|
{
|
|
#if defined(__AVX512F__) && !defined(__AVX512VL__) // KNL
|
|
/* use 16-wide SIMD calculations on KNL even for 4 and 8 wide SIMD */
|
|
static const int size = (N2 == VSIZEX) ? VSIZEX : N;
|
|
#define SIMD_MODE(N) N, 16
|
|
#else
|
|
/* calculate with same SIMD width otherwise */
|
|
static const int size = N;
|
|
#define SIMD_MODE(N) N, N
|
|
#endif
|
|
};
|
|
|
|
/* 4-wide shortcuts */
|
|
typedef vfloat<4> vfloat4;
|
|
typedef vdouble<4> vdouble4;
|
|
typedef vreal<4> vreal4;
|
|
typedef vint<4> vint4;
|
|
typedef vuint<4> vuint4;
|
|
typedef vllong<4> vllong4;
|
|
typedef vbool<4> vbool4;
|
|
typedef vboolf<4> vboolf4;
|
|
typedef vboold<4> vboold4;
|
|
|
|
/* 8-wide shortcuts */
|
|
typedef vfloat<8> vfloat8;
|
|
typedef vdouble<8> vdouble8;
|
|
typedef vreal<8> vreal8;
|
|
typedef vint<8> vint8;
|
|
typedef vuint<8> vuint8;
|
|
typedef vllong<8> vllong8;
|
|
typedef vbool<8> vbool8;
|
|
typedef vboolf<8> vboolf8;
|
|
typedef vboold<8> vboold8;
|
|
|
|
/* 16-wide shortcuts */
|
|
typedef vfloat<16> vfloat16;
|
|
typedef vdouble<16> vdouble16;
|
|
typedef vreal<16> vreal16;
|
|
typedef vint<16> vint16;
|
|
typedef vuint<16> vuint16;
|
|
typedef vllong<16> vllong16;
|
|
typedef vbool<16> vbool16;
|
|
typedef vboolf<16> vboolf16;
|
|
typedef vboold<16> vboold16;
|
|
|
|
/* Default shortcuts */
|
|
typedef vfloat<VSIZEX> vfloatx;
|
|
typedef vdouble<VSIZEX> vdoublex;
|
|
typedef vreal<VSIZEX> vrealx;
|
|
typedef vint<VSIZEX> vintx;
|
|
typedef vuint<VSIZEX> vuintx;
|
|
typedef vllong<VSIZEX> vllongx;
|
|
typedef vbool<VSIZEX> vboolx;
|
|
typedef vboolf<VSIZEX> vboolfx;
|
|
typedef vboold<VSIZEX> vbooldx;
|
|
}
|