/* Copyright (C) 2006 Free Software Foundation, Inc.

   This file is part of GCC.

   GCC is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   GCC is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GCC; see the file COPYING.  If not, write to
   the Free Software Foundation, 59 Temple Place - Suite 330,
   Boston, MA 02111-1307, USA.  */
/* As a special exception, if you include this header file into source
   files compiled by GCC, this header file does not by itself cause
   the resulting executable to be covered by the GNU General Public
   License.  This exception does not however invalidate any other
   reasons why the executable file might be covered by the GNU General
   Public License.  */
27 /* Implemented from the specification included in the Intel C++ Compiler
28 User Guide and Reference, version 9.1. */
30 #ifndef _TMMINTRIN_H_INCLUDED
31 #define _TMMINTRIN_H_INCLUDED
34 #include <pmmintrin.h>
36 static __inline __m128i __attribute__((__always_inline__))
37 _mm_hadd_epi16 (__m128i __X, __m128i __Y)
39 return (__m128i) __builtin_ia32_phaddw128 ((__v8hi)__X, (__v8hi)__Y);
42 static __inline __m128i __attribute__((__always_inline__))
43 _mm_hadd_epi32 (__m128i __X, __m128i __Y)
45 return (__m128i) __builtin_ia32_phaddd128 ((__v4si)__X, (__v4si)__Y);
48 static __inline __m128i __attribute__((__always_inline__))
49 _mm_hadds_epi16 (__m128i __X, __m128i __Y)
51 return (__m128i) __builtin_ia32_phaddsw128 ((__v8hi)__X, (__v8hi)__Y);
54 static __inline __m64 __attribute__((__always_inline__))
55 _mm_hadd_pi16 (__m64 __X, __m64 __Y)
57 return (__m64) __builtin_ia32_phaddw ((__v4hi)__X, (__v4hi)__Y);
60 static __inline __m64 __attribute__((__always_inline__))
61 _mm_hadd_pi32 (__m64 __X, __m64 __Y)
63 return (__m64) __builtin_ia32_phaddd ((__v2si)__X, (__v2si)__Y);
66 static __inline __m64 __attribute__((__always_inline__))
67 _mm_hadds_pi16 (__m64 __X, __m64 __Y)
69 return (__m64) __builtin_ia32_phaddsw ((__v4hi)__X, (__v4hi)__Y);
72 static __inline __m128i __attribute__((__always_inline__))
73 _mm_hsub_epi16 (__m128i __X, __m128i __Y)
75 return (__m128i) __builtin_ia32_phsubw128 ((__v8hi)__X, (__v8hi)__Y);
78 static __inline __m128i __attribute__((__always_inline__))
79 _mm_hsub_epi32 (__m128i __X, __m128i __Y)
81 return (__m128i) __builtin_ia32_phsubd128 ((__v4si)__X, (__v4si)__Y);
84 static __inline __m128i __attribute__((__always_inline__))
85 _mm_hsubs_epi16 (__m128i __X, __m128i __Y)
87 return (__m128i) __builtin_ia32_phsubsw128 ((__v8hi)__X, (__v8hi)__Y);
90 static __inline __m64 __attribute__((__always_inline__))
91 _mm_hsub_pi16 (__m64 __X, __m64 __Y)
93 return (__m64) __builtin_ia32_phsubw ((__v4hi)__X, (__v4hi)__Y);
96 static __inline __m64 __attribute__((__always_inline__))
97 _mm_hsub_pi32 (__m64 __X, __m64 __Y)
99 return (__m64) __builtin_ia32_phsubd ((__v2si)__X, (__v2si)__Y);
102 static __inline __m64 __attribute__((__always_inline__))
103 _mm_hsubs_pi16 (__m64 __X, __m64 __Y)
105 return (__m64) __builtin_ia32_phsubsw ((__v4hi)__X, (__v4hi)__Y);
108 static __inline __m128i __attribute__((__always_inline__))
109 _mm_maddubs_epi16 (__m128i __X, __m128i __Y)
111 return (__m128i) __builtin_ia32_pmaddubsw128 ((__v16qi)__X, (__v16qi)__Y);
114 static __inline __m64 __attribute__((__always_inline__))
115 _mm_maddubs_pi16 (__m64 __X, __m64 __Y)
117 return (__m64) __builtin_ia32_pmaddubsw ((__v8qi)__X, (__v8qi)__Y);
120 static __inline __m128i __attribute__((__always_inline__))
121 _mm_mulhrs_epi16 (__m128i __X, __m128i __Y)
123 return (__m128i) __builtin_ia32_pmulhrsw128 ((__v8hi)__X, (__v8hi)__Y);
126 static __inline __m64 __attribute__((__always_inline__))
127 _mm_mulhrs_pi16 (__m64 __X, __m64 __Y)
129 return (__m64) __builtin_ia32_pmulhrsw ((__v4hi)__X, (__v4hi)__Y);
132 static __inline __m128i __attribute__((__always_inline__))
133 _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
135 return (__m128i) __builtin_ia32_pshufb128 ((__v16qi)__X, (__v16qi)__Y);
138 static __inline __m64 __attribute__((__always_inline__))
139 _mm_shuffle_pi8 (__m64 __X, __m64 __Y)
141 return (__m64) __builtin_ia32_pshufb ((__v8qi)__X, (__v8qi)__Y);
144 static __inline __m128i __attribute__((__always_inline__))
145 _mm_sign_epi8 (__m128i __X, __m128i __Y)
147 return (__m128i) __builtin_ia32_psignb128 ((__v16qi)__X, (__v16qi)__Y);
150 static __inline __m128i __attribute__((__always_inline__))
151 _mm_sign_epi16 (__m128i __X, __m128i __Y)
153 return (__m128i) __builtin_ia32_psignw128 ((__v8hi)__X, (__v8hi)__Y);
156 static __inline __m128i __attribute__((__always_inline__))
157 _mm_sign_epi32 (__m128i __X, __m128i __Y)
159 return (__m128i) __builtin_ia32_psignd128 ((__v4si)__X, (__v4si)__Y);
162 static __inline __m64 __attribute__((__always_inline__))
163 _mm_sign_pi8 (__m64 __X, __m64 __Y)
165 return (__m64) __builtin_ia32_psignb ((__v8qi)__X, (__v8qi)__Y);
168 static __inline __m64 __attribute__((__always_inline__))
169 _mm_sign_pi16 (__m64 __X, __m64 __Y)
171 return (__m64) __builtin_ia32_psignw ((__v4hi)__X, (__v4hi)__Y);
174 static __inline __m64 __attribute__((__always_inline__))
175 _mm_sign_pi32 (__m64 __X, __m64 __Y)
177 return (__m64) __builtin_ia32_psignd ((__v2si)__X, (__v2si)__Y);
/* Expand to a call of __builtin_ia32_palignr128 with __X and __Y cast to
   __v2di and the third argument __N multiplied by 8; the result is cast
   to __m128i.  Every macro argument is parenthesized so that the casts
   apply to the whole argument expression rather than only to its first
   operand.  NOTE(review): the factor 8 presumably converts a byte count
   into a bit count for the builtin -- confirm against its contract.  */
#define _mm_alignr_epi8(__X, __Y, __N)                               \
  ((__m128i) __builtin_ia32_palignr128 ((__v2di) (__X),              \
                                        (__v2di) (__Y),              \
                                        (__N) * 8))
/* Expand to a call of __builtin_ia32_palignr with __X and __Y converted
   to long long and the third argument __N multiplied by 8; the result is
   cast to __m64.  NOTE(review): the factor 8 presumably converts a byte
   count into a bit count for the builtin -- confirm against its
   contract.  */
#define _mm_alignr_pi8(__X, __Y, __N)                                \
  ((__m64) __builtin_ia32_palignr ((long long) (__X),                \
                                   (long long) (__Y),                \
                                   (__N) * 8))
186 static __inline __m128i __attribute__((__always_inline__))
187 _mm_abs_epi8 (__m128i __X)
189 return (__m128i) __builtin_ia32_pabsb128 ((__v16qi)__X);
192 static __inline __m128i __attribute__((__always_inline__))
193 _mm_abs_epi16 (__m128i __X)
195 return (__m128i) __builtin_ia32_pabsw128 ((__v8hi)__X);
198 static __inline __m128i __attribute__((__always_inline__))
199 _mm_abs_epi32 (__m128i __X)
201 return (__m128i) __builtin_ia32_pabsd128 ((__v4si)__X);
204 static __inline __m64 __attribute__((__always_inline__))
205 _mm_abs_pi8 (__m64 __X)
207 return (__m64) __builtin_ia32_pabsb ((__v8qi)__X);
210 static __inline __m64 __attribute__((__always_inline__))
211 _mm_abs_pi16 (__m64 __X)
213 return (__m64) __builtin_ia32_pabsw ((__v4hi)__X);
216 static __inline __m64 __attribute__((__always_inline__))
217 _mm_abs_pi32 (__m64 __X)
219 return (__m64) __builtin_ia32_pabsd ((__v2si)__X);
222 #endif /* __SSSE3__ */
224 #endif /* _TMMINTRIN_H_INCLUDED */
/* Copyright (C) 2006 Free Software Foundation, Inc.

   This file is part of GCC.

   GCC is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   GCC is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GCC; see the file COPYING.  If not, write to
   the Free Software Foundation, 59 Temple Place - Suite 330,
   Boston, MA 02111-1307, USA.  */
/* As a special exception, if you include this header file into source
   files compiled by GCC, this header file does not by itself cause
   the resulting executable to be covered by the GNU General Public
   License.  This exception does not however invalidate any other
   reasons why the executable file might be covered by the GNU General
   Public License.  */
251 /* Implemented from the specification included in the Intel C++ Compiler
252 User Guide and Reference, version 9.1. */
254 #ifndef _TMMINTRIN_H_INCLUDED
255 #define _TMMINTRIN_H_INCLUDED
258 #include <pmmintrin.h>
260 static __inline __m128i __attribute__((__always_inline__))
261 _mm_hadd_epi16 (__m128i __X, __m128i __Y)
263 return (__m128i) __builtin_ia32_phaddw128 ((__v8hi)__X, (__v8hi)__Y);
266 static __inline __m128i __attribute__((__always_inline__))
267 _mm_hadd_epi32 (__m128i __X, __m128i __Y)
269 return (__m128i) __builtin_ia32_phaddd128 ((__v4si)__X, (__v4si)__Y);
272 static __inline __m128i __attribute__((__always_inline__))
273 _mm_hadds_epi16 (__m128i __X, __m128i __Y)
275 return (__m128i) __builtin_ia32_phaddsw128 ((__v8hi)__X, (__v8hi)__Y);
278 static __inline __m64 __attribute__((__always_inline__))
279 _mm_hadd_pi16 (__m64 __X, __m64 __Y)
281 return (__m64) __builtin_ia32_phaddw ((__v4hi)__X, (__v4hi)__Y);
284 static __inline __m64 __attribute__((__always_inline__))
285 _mm_hadd_pi32 (__m64 __X, __m64 __Y)
287 return (__m64) __builtin_ia32_phaddd ((__v2si)__X, (__v2si)__Y);
290 static __inline __m64 __attribute__((__always_inline__))
291 _mm_hadds_pi16 (__m64 __X, __m64 __Y)
293 return (__m64) __builtin_ia32_phaddsw ((__v4hi)__X, (__v4hi)__Y);
296 static __inline __m128i __attribute__((__always_inline__))
297 _mm_hsub_epi16 (__m128i __X, __m128i __Y)
299 return (__m128i) __builtin_ia32_phsubw128 ((__v8hi)__X, (__v8hi)__Y);
302 static __inline __m128i __attribute__((__always_inline__))
303 _mm_hsub_epi32 (__m128i __X, __m128i __Y)
305 return (__m128i) __builtin_ia32_phsubd128 ((__v4si)__X, (__v4si)__Y);
308 static __inline __m128i __attribute__((__always_inline__))
309 _mm_hsubs_epi16 (__m128i __X, __m128i __Y)
311 return (__m128i) __builtin_ia32_phsubsw128 ((__v8hi)__X, (__v8hi)__Y);
314 static __inline __m64 __attribute__((__always_inline__))
315 _mm_hsub_pi16 (__m64 __X, __m64 __Y)
317 return (__m64) __builtin_ia32_phsubw ((__v4hi)__X, (__v4hi)__Y);
320 static __inline __m64 __attribute__((__always_inline__))
321 _mm_hsub_pi32 (__m64 __X, __m64 __Y)
323 return (__m64) __builtin_ia32_phsubd ((__v2si)__X, (__v2si)__Y);
326 static __inline __m64 __attribute__((__always_inline__))
327 _mm_hsubs_pi16 (__m64 __X, __m64 __Y)
329 return (__m64) __builtin_ia32_phsubsw ((__v4hi)__X, (__v4hi)__Y);
332 static __inline __m128i __attribute__((__always_inline__))
333 _mm_maddubs_epi16 (__m128i __X, __m128i __Y)
335 return (__m128i) __builtin_ia32_pmaddubsw128 ((__v16qi)__X, (__v16qi)__Y);
338 static __inline __m64 __attribute__((__always_inline__))
339 _mm_maddubs_pi16 (__m64 __X, __m64 __Y)
341 return (__m64) __builtin_ia32_pmaddubsw ((__v8qi)__X, (__v8qi)__Y);
344 static __inline __m128i __attribute__((__always_inline__))
345 _mm_mulhrs_epi16 (__m128i __X, __m128i __Y)
347 return (__m128i) __builtin_ia32_pmulhrsw128 ((__v8hi)__X, (__v8hi)__Y);
350 static __inline __m64 __attribute__((__always_inline__))
351 _mm_mulhrs_pi16 (__m64 __X, __m64 __Y)
353 return (__m64) __builtin_ia32_pmulhrsw ((__v4hi)__X, (__v4hi)__Y);
356 static __inline __m128i __attribute__((__always_inline__))
357 _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
359 return (__m128i) __builtin_ia32_pshufb128 ((__v16qi)__X, (__v16qi)__Y);
362 static __inline __m64 __attribute__((__always_inline__))
363 _mm_shuffle_pi8 (__m64 __X, __m64 __Y)
365 return (__m64) __builtin_ia32_pshufb ((__v8qi)__X, (__v8qi)__Y);
368 static __inline __m128i __attribute__((__always_inline__))
369 _mm_sign_epi8 (__m128i __X, __m128i __Y)
371 return (__m128i) __builtin_ia32_psignb128 ((__v16qi)__X, (__v16qi)__Y);
374 static __inline __m128i __attribute__((__always_inline__))
375 _mm_sign_epi16 (__m128i __X, __m128i __Y)
377 return (__m128i) __builtin_ia32_psignw128 ((__v8hi)__X, (__v8hi)__Y);
380 static __inline __m128i __attribute__((__always_inline__))
381 _mm_sign_epi32 (__m128i __X, __m128i __Y)
383 return (__m128i) __builtin_ia32_psignd128 ((__v4si)__X, (__v4si)__Y);
386 static __inline __m64 __attribute__((__always_inline__))
387 _mm_sign_pi8 (__m64 __X, __m64 __Y)
389 return (__m64) __builtin_ia32_psignb ((__v8qi)__X, (__v8qi)__Y);
392 static __inline __m64 __attribute__((__always_inline__))
393 _mm_sign_pi16 (__m64 __X, __m64 __Y)
395 return (__m64) __builtin_ia32_psignw ((__v4hi)__X, (__v4hi)__Y);
398 static __inline __m64 __attribute__((__always_inline__))
399 _mm_sign_pi32 (__m64 __X, __m64 __Y)
401 return (__m64) __builtin_ia32_psignd ((__v2si)__X, (__v2si)__Y);
/* Expand to a call of __builtin_ia32_palignr128 with __X and __Y cast to
   __v2di and the third argument __N multiplied by 8; the result is cast
   to __m128i.  Every macro argument is parenthesized so that the casts
   apply to the whole argument expression rather than only to its first
   operand.  NOTE(review): the factor 8 presumably converts a byte count
   into a bit count for the builtin -- confirm against its contract.  */
#define _mm_alignr_epi8(__X, __Y, __N)                               \
  ((__m128i) __builtin_ia32_palignr128 ((__v2di) (__X),              \
                                        (__v2di) (__Y),              \
                                        (__N) * 8))
/* Expand to a call of __builtin_ia32_palignr with __X and __Y converted
   to long long and the third argument __N multiplied by 8; the result is
   cast to __m64.  NOTE(review): the factor 8 presumably converts a byte
   count into a bit count for the builtin -- confirm against its
   contract.  */
#define _mm_alignr_pi8(__X, __Y, __N)                                \
  ((__m64) __builtin_ia32_palignr ((long long) (__X),                \
                                   (long long) (__Y),                \
                                   (__N) * 8))
410 static __inline __m128i __attribute__((__always_inline__))
411 _mm_abs_epi8 (__m128i __X)
413 return (__m128i) __builtin_ia32_pabsb128 ((__v16qi)__X);
416 static __inline __m128i __attribute__((__always_inline__))
417 _mm_abs_epi16 (__m128i __X)
419 return (__m128i) __builtin_ia32_pabsw128 ((__v8hi)__X);
422 static __inline __m128i __attribute__((__always_inline__))
423 _mm_abs_epi32 (__m128i __X)
425 return (__m128i) __builtin_ia32_pabsd128 ((__v4si)__X);
428 static __inline __m64 __attribute__((__always_inline__))
429 _mm_abs_pi8 (__m64 __X)
431 return (__m64) __builtin_ia32_pabsb ((__v8qi)__X);
434 static __inline __m64 __attribute__((__always_inline__))
435 _mm_abs_pi16 (__m64 __X)
437 return (__m64) __builtin_ia32_pabsw ((__v4hi)__X);
440 static __inline __m64 __attribute__((__always_inline__))
441 _mm_abs_pi32 (__m64 __X)
443 return (__m64) __builtin_ia32_pabsd ((__v2si)__X);
446 #endif /* __SSSE3__ */
448 #endif /* _TMMINTRIN_H_INCLUDED */