xref: /minix3/external/bsd/llvm/dist/clang/test/CodeGen/avx-builtins.c (revision 0a6a1f1d05b60e214de2f05a7310ddd1f0e590e7)
1f4a2713aSLionel Sambuc // RUN: %clang_cc1 %s -O3 -triple=x86_64-apple-darwin -target-feature +avx -emit-llvm -o - | FileCheck %s
2f4a2713aSLionel Sambuc 
// Don't include mm_malloc.h; it is system-specific.
4f4a2713aSLionel Sambuc #define __MM_MALLOC_H
5f4a2713aSLionel Sambuc 
6f4a2713aSLionel Sambuc #include <immintrin.h>
7f4a2713aSLionel Sambuc 
//
// Test LLVM IR codegen of shuffle instructions
//
11f4a2713aSLionel Sambuc 
test__mm256_loadu_ps(void * p)12f4a2713aSLionel Sambuc __m256 test__mm256_loadu_ps(void* p) {
13f4a2713aSLionel Sambuc   // CHECK: load <8 x float>* %{{.*}}, align 1
14f4a2713aSLionel Sambuc   return _mm256_loadu_ps(p);
15f4a2713aSLionel Sambuc }
16f4a2713aSLionel Sambuc 
test__mm256_loadu_pd(void * p)17f4a2713aSLionel Sambuc __m256d test__mm256_loadu_pd(void* p) {
18f4a2713aSLionel Sambuc   // CHECK: load <4 x double>* %{{.*}}, align 1
19f4a2713aSLionel Sambuc   return _mm256_loadu_pd(p);
20f4a2713aSLionel Sambuc }
21f4a2713aSLionel Sambuc 
test__mm256_loadu_si256(void * p)22f4a2713aSLionel Sambuc __m256i test__mm256_loadu_si256(void* p) {
23f4a2713aSLionel Sambuc   // CHECK: load <4 x i64>* %{{.+}}, align 1
24f4a2713aSLionel Sambuc   return _mm256_loadu_si256(p);
25f4a2713aSLionel Sambuc }
26f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestrm (explicit-length string compare, mask result):
// with immediate 7, the emitted IR is expected to reference the
// llvm.x86.sse42.pcmpestrm128 intrinsic.
// The immediate must remain a literal constant.
__m128i test_mm_cmpestrm(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestrm128
  return _mm_cmpestrm(A, LA, B, LB, 7);
}
31f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestri: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpestri128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpestri(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestri128
  return _mm_cmpestri(A, LA, B, LB, 7);
}
36f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestra: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpestria128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpestra(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestria128
  return _mm_cmpestra(A, LA, B, LB, 7);
}
41f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestrc: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpestric128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpestrc(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestric128
  return _mm_cmpestrc(A, LA, B, LB, 7);
}
46f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestro: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpestrio128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpestro(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestrio128
  return _mm_cmpestro(A, LA, B, LB, 7);
}
51f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestrs: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpestris128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpestrs(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestris128
  return _mm_cmpestrs(A, LA, B, LB, 7);
}
56f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpestrz: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpestriz128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpestrz(__m128i A, int LA, __m128i B, int LB) {
  // CHECK: @llvm.x86.sse42.pcmpestriz128
  return _mm_cmpestrz(A, LA, B, LB, 7);
}
61f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistrm (implicit-length string compare, mask result):
// with immediate 7, the emitted IR is expected to reference the
// llvm.x86.sse42.pcmpistrm128 intrinsic.
// The immediate must remain a literal constant.
__m128i test_mm_cmpistrm(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistrm128
  return _mm_cmpistrm(A, B, 7);
}
66f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistri: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpistri128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpistri(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistri128
  return _mm_cmpistri(A, B, 7);
}
71f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistra: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpistria128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpistra(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistria128
  return _mm_cmpistra(A, B, 7);
}
76f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistrc: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpistric128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpistrc(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistric128
  return _mm_cmpistrc(A, B, 7);
}
81f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistro: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpistrio128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpistro(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistrio128
  return _mm_cmpistro(A, B, 7);
}
86f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistrs: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpistris128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpistrs(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistris128
  return _mm_cmpistrs(A, B, 7);
}
91f4a2713aSLionel Sambuc 
// Codegen test for _mm_cmpistrz: with immediate 7, the emitted IR is expected
// to reference the llvm.x86.sse42.pcmpistriz128 intrinsic.
// The immediate must remain a literal constant.
int test_mm_cmpistrz(__m128i A, __m128i B) {
  // CHECK: @llvm.x86.sse42.pcmpistriz128
  return _mm_cmpistrz(A, B, 7);
}
96f4a2713aSLionel Sambuc 
// Codegen test for _mm256_extract_epi32 with an out-of-range index.
// The call passes index 8, one past the last lane of an <8 x i32> vector, and
// the expected IR extracts element 0. Presumably the index is masked to the
// lane count; the deliberately out-of-range literal must not be "corrected".
int test_extract_epi32(__m256i __a) {
  // CHECK-LABEL: @test_extract_epi32
  // CHECK: extractelement <8 x i32> %{{.*}}, i32 0
  return _mm256_extract_epi32(__a, 8);
}
102f4a2713aSLionel Sambuc 
// Codegen test for _mm256_extract_epi16 with an out-of-range index.
// The call passes index 16, one past the last lane of a <16 x i16> vector, and
// the expected IR extracts element 0. Presumably the index is masked to the
// lane count; the deliberately out-of-range literal must not be "corrected".
int test_extract_epi16(__m256i __a) {
  // CHECK-LABEL: @test_extract_epi16
  // CHECK: extractelement <16 x i16> %{{.*}}, i32 0
  return _mm256_extract_epi16(__a, 16);
}
108f4a2713aSLionel Sambuc 
// Codegen test for _mm256_extract_epi8 with an out-of-range index.
// The call passes index 32, one past the last lane of a <32 x i8> vector, and
// the expected IR extracts element 0. Presumably the index is masked to the
// lane count; the deliberately out-of-range literal must not be "corrected".
int test_extract_epi8(__m256i __a) {
  // CHECK-LABEL: @test_extract_epi8
  // CHECK: extractelement <32 x i8> %{{.*}}, i32 0
  return _mm256_extract_epi8(__a, 32);
}
114*0a6a1f1dSLionel Sambuc 
// Codegen test for _mm256_blend_pd: the blend is expected to lower to a plain
// shufflevector rather than a target intrinsic call.
// The mask 0x35 has bits 0 and 2 set within its low four bits; the expected
// shuffle takes lanes 0 and 2 from __b (indices 4 and 6) and lanes 1 and 3
// from __a. The upper mask bits have no counterpart in the 4-lane shuffle.
__m256d test_256_blend_pd(__m256d __a, __m256d __b) {
  // CHECK-LABEL: @test_256_blend_pd
  // CHECK: shufflevector <4 x double> %{{.*}}, <4 x double> %{{.*}}, <4 x i32> <i32 4, i32 1, i32 6, i32 3>
  return _mm256_blend_pd(__a, __b, 0x35);
}
120*0a6a1f1dSLionel Sambuc 
// Codegen test for _mm256_blend_ps: the blend is expected to lower to a plain
// shufflevector rather than a target intrinsic call.
// The mask 0x35 has bits 0, 2, 4 and 5 set; the expected shuffle takes those
// lanes from __b (indices 8, 10, 12, 13) and lanes 1, 3, 6, 7 from __a.
__m256 test_256_blend_ps(__m256 __a, __m256 __b) {
  // CHECK-LABEL: @test_256_blend_ps
  // CHECK: shufflevector <8 x float> %{{.*}}, <8 x float> %{{.*}}, <8 x i32> <i32 8, i32 1, i32 10, i32 3, i32 12, i32 13, i32 6, i32 7>
  return _mm256_blend_ps(__a, __b, 0x35);
}
126