blob: c21bbfda724d43647f03aa39555e78f6836712e6 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
|
// Inclusion guard of the "must be included by a parent" kind: unless
// _NPY_SIMD_H_ has already been defined by whoever includes this file,
// compilation stops with an explicit error instead of failing later on
// undeclared names.
#ifndef _NPY_SIMD_H_
#error "Not a standalone header"
#endif
// Byte-order flag of this backend; fixed to 0 here.
#define NPY_SIMD_BIGENDIAN 0
// Vector size constants: 128 and 16 (presumably the register size in bits and
// in bytes respectively, in line with the __m128* types this header relies on).
#define NPY_SIMD_WIDTH 16
#define NPY_SIMD 128
// Both floating-point flags (f32 and f64) are switched on.
#define NPY_SIMD_F64 1
#define NPY_SIMD_F32 1
// NPY_SIMD_FMA3 is 1 as soon as either NPY_HAVE_FMA3 or NPY_HAVE_FMA4 is
// defined by the build, and 0 when neither is.
#if !defined(NPY_HAVE_FMA3) && !defined(NPY_HAVE_FMA4)
#define NPY_SIMD_FMA3 0 // fast emulated
#else
#define NPY_SIMD_FMA3 1 // native support
#endif
// Every integer vector alias, whatever its lane width or signedness, is the
// same underlying type: __m128i.
typedef __m128i npyv_u8,  npyv_s8,
                npyv_u16, npyv_s16,
                npyv_u32, npyv_s32,
                npyv_u64, npyv_s64;
// The npyv_b* aliases (presumably boolean/mask vectors) are __m128i as well.
typedef __m128i npyv_b8, npyv_b16, npyv_b32, npyv_b64;
// Floating-point vectors use the dedicated single/double precision types.
typedef __m128  npyv_f32;
typedef __m128d npyv_f64;
// Two-vector tuples. All integer flavours alias one struct that holds two
// __m128i values in `val`; f32 and f64 each get their own struct.
typedef struct {
    __m128i val[2];
} npyv_m128ix2;
typedef npyv_m128ix2 npyv_u8x2,  npyv_s8x2,
                     npyv_u16x2, npyv_s16x2,
                     npyv_u32x2, npyv_s32x2,
                     npyv_u64x2, npyv_s64x2;
typedef struct {
    __m128 val[2];
} npyv_f32x2;
typedef struct {
    __m128d val[2];
} npyv_f64x2;

// Three-vector tuples, laid out the same way with three values in `val`.
typedef struct {
    __m128i val[3];
} npyv_m128ix3;
typedef npyv_m128ix3 npyv_u8x3,  npyv_s8x3,
                     npyv_u16x3, npyv_s16x3,
                     npyv_u32x3, npyv_s32x3,
                     npyv_u64x3, npyv_s64x3;
typedef struct {
    __m128 val[3];
} npyv_f32x3;
typedef struct {
    __m128d val[3];
} npyv_f64x3;
// Lane count for each element suffix, listed from the most lanes to the
// fewest. Values are kept as plain integer literals.
// 16 lanes
#define npyv_nlanes_s8 16
#define npyv_nlanes_u8 16
// 8 lanes
#define npyv_nlanes_s16 8
#define npyv_nlanes_u16 8
// 4 lanes
#define npyv_nlanes_f32 4
#define npyv_nlanes_s32 4
#define npyv_nlanes_u32 4
// 2 lanes
#define npyv_nlanes_f64 2
#define npyv_nlanes_s64 2
#define npyv_nlanes_u64 2
#include "utils.h"
#include "memory.h"
#include "misc.h"
#include "reorder.h"
#include "operators.h"
#include "conversion.h"
#include "arithmetic.h"
#include "math.h"
|