1 // RUN: %clang_cc1 %s -O3 -triple=x86_64-apple-darwin -target-feature +fma4 -emit-llvm -o - | FileCheck %s
3 // Don't include mm_malloc.h, it's system specific.
8 __m128 test_mm_macc_ps(__m128 a, __m128 b, __m128 c) {
9 // CHECK: @llvm.x86.fma.vfmadd.ps
10 return _mm_macc_ps(a, b, c);
13 __m128d test_mm_macc_pd(__m128d a, __m128d b, __m128d c) {
14 // CHECK: @llvm.x86.fma.vfmadd.pd
15 return _mm_macc_pd(a, b, c);
18 __m128 test_mm_macc_ss(__m128 a, __m128 b, __m128 c) {
19 // CHECK: @llvm.x86.fma.vfmadd.ss
20 return _mm_macc_ss(a, b, c);
23 __m128d test_mm_macc_sd(__m128d a, __m128d b, __m128d c) {
24 // CHECK: @llvm.x86.fma.vfmadd.sd
25 return _mm_macc_sd(a, b, c);
28 __m128 test_mm_msub_ps(__m128 a, __m128 b, __m128 c) {
29 // CHECK: @llvm.x86.fma.vfmsub.ps
30 return _mm_msub_ps(a, b, c);
33 __m128d test_mm_msub_pd(__m128d a, __m128d b, __m128d c) {
34 // CHECK: @llvm.x86.fma.vfmsub.pd
35 return _mm_msub_pd(a, b, c);
38 __m128 test_mm_msub_ss(__m128 a, __m128 b, __m128 c) {
39 // CHECK: @llvm.x86.fma.vfmsub.ss
40 return _mm_msub_ss(a, b, c);
43 __m128d test_mm_msub_sd(__m128d a, __m128d b, __m128d c) {
44 // CHECK: @llvm.x86.fma.vfmsub.sd
45 return _mm_msub_sd(a, b, c);
48 __m128 test_mm_nmacc_ps(__m128 a, __m128 b, __m128 c) {
49 // CHECK: @llvm.x86.fma.vfnmadd.ps
50 return _mm_nmacc_ps(a, b, c);
53 __m128d test_mm_nmacc_pd(__m128d a, __m128d b, __m128d c) {
54 // CHECK: @llvm.x86.fma.vfnmadd.pd
55 return _mm_nmacc_pd(a, b, c);
58 __m128 test_mm_nmacc_ss(__m128 a, __m128 b, __m128 c) {
59 // CHECK: @llvm.x86.fma.vfnmadd.ss
60 return _mm_nmacc_ss(a, b, c);
63 __m128d test_mm_nmacc_sd(__m128d a, __m128d b, __m128d c) {
64 // CHECK: @llvm.x86.fma.vfnmadd.sd
65 return _mm_nmacc_sd(a, b, c);
68 __m128 test_mm_nmsub_ps(__m128 a, __m128 b, __m128 c) {
69 // CHECK: @llvm.x86.fma.vfnmsub.ps
70 return _mm_nmsub_ps(a, b, c);
73 __m128d test_mm_nmsub_pd(__m128d a, __m128d b, __m128d c) {
74 // CHECK: @llvm.x86.fma.vfnmsub.pd
75 return _mm_nmsub_pd(a, b, c);
78 __m128 test_mm_nmsub_ss(__m128 a, __m128 b, __m128 c) {
79 // CHECK: @llvm.x86.fma.vfnmsub.ss
80 return _mm_nmsub_ss(a, b, c);
83 __m128d test_mm_nmsub_sd(__m128d a, __m128d b, __m128d c) {
84 // CHECK: @llvm.x86.fma.vfnmsub.sd
85 return _mm_nmsub_sd(a, b, c);
88 __m128 test_mm_maddsub_ps(__m128 a, __m128 b, __m128 c) {
89 // CHECK: @llvm.x86.fma.vfmaddsub.ps
90 return _mm_maddsub_ps(a, b, c);
93 __m128d test_mm_maddsub_pd(__m128d a, __m128d b, __m128d c) {
94 // CHECK: @llvm.x86.fma.vfmaddsub.pd
95 return _mm_maddsub_pd(a, b, c);
98 __m128 test_mm_msubadd_ps(__m128 a, __m128 b, __m128 c) {
99 // CHECK: @llvm.x86.fma.vfmsubadd.ps
100 return _mm_msubadd_ps(a, b, c);
103 __m128d test_mm_msubadd_pd(__m128d a, __m128d b, __m128d c) {
104 // CHECK: @llvm.x86.fma.vfmsubadd.pd
105 return _mm_msubadd_pd(a, b, c);
108 __m256 test_mm256_macc_ps(__m256 a, __m256 b, __m256 c) {
109 // CHECK: @llvm.x86.fma.vfmadd.ps.256
110 return _mm256_macc_ps(a, b, c);
113 __m256d test_mm256_macc_pd(__m256d a, __m256d b, __m256d c) {
114 // CHECK: @llvm.x86.fma.vfmadd.pd.256
115 return _mm256_macc_pd(a, b, c);
118 __m256 test_mm256_msub_ps(__m256 a, __m256 b, __m256 c) {
119 // CHECK: @llvm.x86.fma.vfmsub.ps.256
120 return _mm256_msub_ps(a, b, c);
123 __m256d test_mm256_msub_pd(__m256d a, __m256d b, __m256d c) {
124 // CHECK: @llvm.x86.fma.vfmsub.pd.256
125 return _mm256_msub_pd(a, b, c);
128 __m256 test_mm256_nmacc_ps(__m256 a, __m256 b, __m256 c) {
129 // CHECK: @llvm.x86.fma.vfnmadd.ps.256
130 return _mm256_nmacc_ps(a, b, c);
133 __m256d test_mm256_nmacc_pd(__m256d a, __m256d b, __m256d c) {
134 // CHECK: @llvm.x86.fma.vfnmadd.pd.256
135 return _mm256_nmacc_pd(a, b, c);
138 __m256 test_mm256_nmsub_ps(__m256 a, __m256 b, __m256 c) {
139 // CHECK: @llvm.x86.fma.vfnmsub.ps.256
140 return _mm256_nmsub_ps(a, b, c);
143 __m256d test_mm256_nmsub_pd(__m256d a, __m256d b, __m256d c) {
144 // CHECK: @llvm.x86.fma.vfnmsub.pd.256
145 return _mm256_nmsub_pd(a, b, c);
148 __m256 test_mm256_maddsub_ps(__m256 a, __m256 b, __m256 c) {
149 // CHECK: @llvm.x86.fma.vfmaddsub.ps.256
150 return _mm256_maddsub_ps(a, b, c);
153 __m256d test_mm256_maddsub_pd(__m256d a, __m256d b, __m256d c) {
154 // CHECK: @llvm.x86.fma.vfmaddsub.pd.256
155 return _mm256_maddsub_pd(a, b, c);
158 __m256 test_mm256_msubadd_ps(__m256 a, __m256 b, __m256 c) {
159 // CHECK: @llvm.x86.fma.vfmsubadd.ps.256
160 return _mm256_msubadd_ps(a, b, c);
163 __m256d test_mm256_msubadd_pd(__m256d a, __m256d b, __m256d c) {
164 // CHECK: @llvm.x86.fma.vfmsubadd.pd.256
165 return _mm256_msubadd_pd(a, b, c);