-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathxmmintrin.pxd
281 lines (170 loc) · 7.81 KB
/
xmmintrin.pxd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
# -*- coding: utf-8 -*-
# xmmintrin.pxd
include "mmintrin.pxd"
# Cython declarations for the SSE intrinsics provided by <xmmintrin.h>.
# Every function is declared `nogil` so it can be called from nogil sections.
# __m64 and __int64 are not declared in this block; presumably they come from
# the included mmintrin.pxd -- confirm if that include is changed.
cdef extern from "xmmintrin.h":
    # Cython only needs these type names to exist; the C compiler picks up the
    # real definitions from the header.
    ctypedef int __v4si
    ctypedef float __v4sf
    ctypedef float __m128
    ctypedef unsigned int __v4su

    # Hint constants; see the `i` argument of _mm_prefetch below.
    cdef enum _mm_hint:
        _MM_HINT_ET0
        _MM_HINT_ET1
        _MM_HINT_T0
        _MM_HINT_T1
        _MM_HINT_T2
        _MM_HINT_NTA

    __m128 _mm_add_ps (__m128 a, __m128 b) nogil
    __m128 _mm_add_ss (__m128 a, __m128 b) nogil
    __m128 _mm_and_ps (__m128 a, __m128 b) nogil
    __m128 _mm_andnot_ps (__m128 a, __m128 b) nogil
    __m64 _mm_avg_pu16 (__m64 a, __m64 b) nogil
    __m64 _mm_avg_pu8 (__m64 a, __m64 b) nogil
    __m128 _mm_cmpeq_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpeq_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpge_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpge_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpgt_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpgt_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmple_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmple_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmplt_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmplt_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpneq_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpneq_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpnge_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpnge_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpngt_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpngt_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpnle_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpnle_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpnlt_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpnlt_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpord_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpord_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cmpunord_ps (__m128 a, __m128 b) nogil
    __m128 _mm_cmpunord_ss (__m128 a, __m128 b) nogil
    int _mm_comieq_ss (__m128 a, __m128 b) nogil
    int _mm_comige_ss (__m128 a, __m128 b) nogil
    int _mm_comigt_ss (__m128 a, __m128 b) nogil
    int _mm_comile_ss (__m128 a, __m128 b) nogil
    int _mm_comilt_ss (__m128 a, __m128 b) nogil
    int _mm_comineq_ss (__m128 a, __m128 b) nogil
    __m128 _mm_cvt_pi2ps (__m128 a, __m64 b) nogil
    __m64 _mm_cvt_ps2pi (__m128 a) nogil
    __m128 _mm_cvt_si2ss (__m128 a, int b) nogil
    int _mm_cvt_ss2si (__m128 a) nogil
    __m128 _mm_cvtpi16_ps (__m64 a) nogil
    __m128 _mm_cvtpi32_ps (__m128 a, __m64 b) nogil
    __m128 _mm_cvtpi32x2_ps (__m64 a, __m64 b) nogil
    __m128 _mm_cvtpi8_ps (__m64 a) nogil
    __m64 _mm_cvtps_pi16 (__m128 a) nogil
    __m64 _mm_cvtps_pi32 (__m128 a) nogil
    __m64 _mm_cvtps_pi8 (__m128 a) nogil
    __m128 _mm_cvtpu16_ps (__m64 a) nogil
    __m128 _mm_cvtpu8_ps (__m64 a) nogil
    __m128 _mm_cvtsi32_ss (__m128 a, int b) nogil
    __m128 _mm_cvtsi64_ss (__m128 a, __int64 b) nogil
    float _mm_cvtss_f32 (__m128 a) nogil
    int _mm_cvtss_si32 (__m128 a) nogil
    __int64 _mm_cvtss_si64 (__m128 a) nogil
    __m64 _mm_cvtt_ps2pi (__m128 a) nogil
    int _mm_cvtt_ss2si (__m128 a) nogil
    __m64 _mm_cvttps_pi32 (__m128 a) nogil
    int _mm_cvttss_si32 (__m128 a) nogil
    __int64 _mm_cvttss_si64 (__m128 a) nogil
    __m128 _mm_div_ps (__m128 a, __m128 b) nogil
    __m128 _mm_div_ss (__m128 a, __m128 b) nogil
    int _mm_extract_pi16 (__m64 a, int imm8) nogil
    void _mm_free (void * mem_addr) nogil
    unsigned int _MM_GET_EXCEPTION_MASK () nogil
    unsigned int _MM_GET_EXCEPTION_STATE () nogil
    unsigned int _MM_GET_FLUSH_ZERO_MODE () nogil
    unsigned int _MM_GET_ROUNDING_MODE () nogil
    unsigned int _mm_getcsr () nogil
    __m64 _mm_insert_pi16 (__m64 a, int i, int imm8) nogil
    __m128 _mm_load_ps (float * mem_addr) nogil
    __m128 _mm_load_ps1 (float * mem_addr) nogil
    __m128 _mm_load_ss (float * mem_addr) nogil
    __m128 _mm_load1_ps (float * mem_addr) nogil
    __m128 _mm_loadh_pi (__m128 a, __m64 * mem_addr) nogil
    __m128 _mm_loadl_pi (__m128 a, __m64 * mem_addr) nogil
    __m128 _mm_loadr_ps (float * mem_addr) nogil
    __m128 _mm_loadu_ps (float * mem_addr) nogil
    void* _mm_malloc (size_t size, size_t align) nogil
    void _mm_maskmove_si64 (__m64 a, __m64 mask, char* mem_addr) nogil
    void _m_maskmovq (__m64 a, __m64 mask, char* mem_addr) nogil
    __m64 _mm_max_pi16 (__m64 a, __m64 b) nogil
    __m128 _mm_max_ps (__m128 a, __m128 b) nogil
    __m64 _mm_max_pu8 (__m64 a, __m64 b) nogil
    __m128 _mm_max_ss (__m128 a, __m128 b) nogil
    __m64 _mm_min_pi16 (__m64 a, __m64 b) nogil
    __m128 _mm_min_ps (__m128 a, __m128 b) nogil
    __m64 _mm_min_pu8 (__m64 a, __m64 b) nogil
    __m128 _mm_min_ss (__m128 a, __m128 b) nogil
    __m128 _mm_move_ss (__m128 a, __m128 b) nogil
    __m128 _mm_movehl_ps (__m128 a, __m128 b) nogil
    __m128 _mm_movelh_ps (__m128 a, __m128 b) nogil
    int _mm_movemask_pi8 (__m64 a) nogil
    int _mm_movemask_ps (__m128 a) nogil
    __m128 _mm_mul_ps (__m128 a, __m128 b) nogil
    __m128 _mm_mul_ss (__m128 a, __m128 b) nogil
    __m64 _mm_mulhi_pu16 (__m64 a, __m64 b) nogil
    __m128 _mm_or_ps (__m128 a, __m128 b) nogil
    __m64 _m_pavgb (__m64 a, __m64 b) nogil
    __m64 _m_pavgw (__m64 a, __m64 b) nogil
    int _m_pextrw (__m64 a, int imm8) nogil
    __m64 _m_pinsrw (__m64 a, int i, int imm8) nogil
    __m64 _m_pmaxsw (__m64 a, __m64 b) nogil
    __m64 _m_pmaxub (__m64 a, __m64 b) nogil
    __m64 _m_pminsw (__m64 a, __m64 b) nogil
    __m64 _m_pminub (__m64 a, __m64 b) nogil
    int _m_pmovmskb (__m64 a) nogil
    __m64 _m_pmulhuw (__m64 a, __m64 b) nogil
    # Declared once: `i` selects the hint (one of the _MM_HINT_* values), so a
    # single declaration serves every hint.
    void _mm_prefetch (char * p, int i) nogil
    __m64 _m_psadbw (__m64 a, __m64 b) nogil
    __m64 _m_pshufw (__m64 a, int imm8) nogil
    __m128 _mm_rcp_ps (__m128 a) nogil
    __m128 _mm_rcp_ss (__m128 a) nogil
    __m128 _mm_rsqrt_ps (__m128 a) nogil
    __m128 _mm_rsqrt_ss (__m128 a) nogil
    __m64 _mm_sad_pu8 (__m64 a, __m64 b) nogil
    void _MM_SET_EXCEPTION_MASK (unsigned int a) nogil
    void _MM_SET_EXCEPTION_STATE (unsigned int a) nogil
    void _MM_SET_FLUSH_ZERO_MODE (unsigned int a) nogil
    __m128 _mm_set_ps (float e3, float e2, float e1, float e0) nogil
    __m128 _mm_set_ps1 (float a) nogil
    void _MM_SET_ROUNDING_MODE (unsigned int a) nogil
    __m128 _mm_set_ss (float a) nogil
    __m128 _mm_set1_ps (float a) nogil
    void _mm_setcsr (unsigned int a) nogil
    __m128 _mm_setr_ps (float e3, float e2, float e1, float e0) nogil
    __m128 _mm_setzero_ps () nogil
    void _mm_sfence () nogil
    __m64 _mm_shuffle_pi16 (__m64 a, int imm8) nogil
    __m128 _mm_shuffle_ps (__m128 a, __m128 b, unsigned int imm8) nogil
    __m128 _mm_sqrt_ps (__m128 a) nogil
    __m128 _mm_sqrt_ss (__m128 a) nogil
    void _mm_store_ps (float* mem_addr, __m128 a) nogil
    void _mm_store_ps1 (float* mem_addr, __m128 a) nogil
    void _mm_store_ss (float* mem_addr, __m128 a) nogil
    void _mm_store1_ps (float* mem_addr, __m128 a) nogil
    void _mm_storeh_pi (__m64* mem_addr, __m128 a) nogil
    void _mm_storel_pi (__m64* mem_addr, __m128 a) nogil
    void _mm_storer_ps (float* mem_addr, __m128 a) nogil
    void _mm_storeu_ps (float* mem_addr, __m128 a) nogil
    void _mm_stream_pi (__m64* mem_addr, __m64 a) nogil
    void _mm_stream_ps (float* mem_addr, __m128 a) nogil
    __m128 _mm_sub_ps (__m128 a, __m128 b) nogil
    __m128 _mm_sub_ss (__m128 a, __m128 b) nogil
    # Explicit `void`: without a return type Cython assumes a Python object,
    # which is incompatible with `nogil`.
    # NOTE(review): in the C header this is a macro that transposes the four
    # rows in place, so callers should pass plain __m128 variables -- confirm
    # against the Intel Intrinsics Guide.
    void _MM_TRANSPOSE4_PS (__m128 row0, __m128 row1, __m128 row2, __m128 row3) nogil
    int _mm_ucomieq_ss (__m128 a, __m128 b) nogil
    int _mm_ucomige_ss (__m128 a, __m128 b) nogil
    int _mm_ucomigt_ss (__m128 a, __m128 b) nogil
    int _mm_ucomile_ss (__m128 a, __m128 b) nogil
    int _mm_ucomilt_ss (__m128 a, __m128 b) nogil
    int _mm_ucomineq_ss (__m128 a, __m128 b) nogil
    __m128 _mm_unpackhi_ps (__m128 a, __m128 b) nogil
    __m128 _mm_unpacklo_ps (__m128 a, __m128 b) nogil
    __m128 _mm_xor_ps (__m128 a, __m128 b) nogil