// RUN: %clang_cc1 -triple x86_64-apple-darwin -std=c++11 -emit-llvm -o - %s | FileCheck %s

// Code generation test for `#pragma clang loop`: each function below attaches
// loop hints to a different kind of loop, and the FileCheck directives verify
// that the loop's branch instruction carries `!llvm.loop` metadata. The
// metadata node captured at each loop (LOOP_1, LOOP_2, ...) is matched against
// its expected contents by the directives at the end of the file.

// Verify a while loop is recognized after a sequence of pragma clang loop
// directives. Five separate single-option directives are stacked on one loop.
void while_test(int *List, int Length) {
  // CHECK: define {{.*}} @_Z10while_test
  int i = 0;

#pragma clang loop vectorize(enable)
#pragma clang loop interleave_count(4)
#pragma clang loop vectorize_width(4)
#pragma clang loop unroll(full)
#pragma clang loop distribute(enable)
  while (i < Length) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_1).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_1:.*]]
    List[i] = i * 2;
    i++;
  }
}

// Verify a do loop is recognized after a multi-option pragma clang loop
// directive. All four options are given on a single pragma line.
void do_test(int *List, int Length) {
  int i = 0;

#pragma clang loop vectorize_width(8) interleave_count(4) unroll(disable) distribute(disable)
  do {
    // Expect a conditional branch tagged with loop metadata (LOOP_2).
    // CHECK: br i1 {{.*}}, label {{.*}}, label {{.*}}, !llvm.loop ![[LOOP_2:.*]]
    List[i] = i * 2;
    i++;
  } while (i < Length);
}

// Scoped enumeration with a `short` underlying type. for_test below passes its
// enumerators, converted with static_cast<int>, as pragma arguments.
enum struct Tuner : short { Interleave = 4, Unroll = 8 };

// Verify a for loop is recognized after a sequence of pragma clang loop
// directives. The count arguments are cast expressions rather than literals.
void for_test(int *List, int Length) {
#pragma clang loop interleave(enable)
#pragma clang loop interleave_count(static_cast<int>(Tuner::Interleave))
#pragma clang loop unroll_count(static_cast<int>(Tuner::Unroll))
  for (int i = 0; i < Length; i++) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_3).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_3:.*]]
    List[i] = i * 2;
  }
}

// Verify a C++11 range-based for loop is recognized after a
// sequence of pragma clang loop directives.
// Applies vectorize_width and interleave_count hints to a range-based for loop
// over a local array.
// NOTE(review): List is never initialized, and its double elements are
// converted to int and then used as indices into List. That is harmless only
// while this file is compiled to IR and never executed - confirm before
// reusing this body elsewhere.
void for_range_test() {
  double List[100];

#pragma clang loop vectorize_width(2) interleave_count(2)
  for (int i : List) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_4).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_4:.*]]
    List[i] = i;
  }
}

// Verify the disable forms of the pragma clang loop options generate correct
// metadata.
void disable_test(int *List, int Length) {
#pragma clang loop vectorize(disable) unroll(disable) distribute(disable)
  for (int i = 0; i < Length; i++) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_5).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_5:.*]]
    List[i] = i * 2;
  }
}

// Macros used as pragma arguments by the tests that follow.
#define VECWIDTH 2
#define INTCOUNT 2
#define UNROLLCOUNT 8

// Verify macro definitions are correctly resolved inside pragma clang loop
// directives.
void for_define_test(int *List, int Length, int Value) {
#pragma clang loop vectorize_width(VECWIDTH) interleave_count(INTCOUNT)
#pragma clang loop unroll_count(UNROLLCOUNT)
  for (int i = 0; i < Length; i++) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_6).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_6:.*]]
    List[i] = i * Value;
  }
}

// Verify constant expressions are handled correctly as pragma arguments.
// NOTE(review): "contant" in the function name is a typo for "constant". It is
// left as is because renaming the function changes the emitted symbol name.
void for_contant_expression_test(int *List, int Length) {
  // Literal-only expression: 1 + 4 == 5.
#pragma clang loop vectorize_width(1 + 4)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_7:.*]]
    List[i] = i;
  }

  // Expression mixing a literal with a macro: 3 + VECWIDTH == 5.
#pragma clang loop vectorize_width(3 + VECWIDTH)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_8:.*]]
    List[i] += i;
  }
}

// Verify metadata is generated when the loop lives in a function template.
// The pragma arguments here are plain literals; only the element type A
// depends on the template parameter.
template <typename A>
void for_template_test(A *List, int Length, A Value) {
#pragma clang loop vectorize_width(8) interleave_count(8) unroll_count(8)
  for (int i = 0; i < Length; i++) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_9).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_9:.*]]
    List[i] = i * Value;
  }
}

// Verify a macro definition is resolved correctly when a template is used.
// The pragma arguments are const locals whose type is the template parameter
// T, each initialized from one of the VECWIDTH / INTCOUNT / UNROLLCOUNT
// macros (2, 2 and 8).
template <typename A, typename T>
void for_template_define_test(A *List, int Length, A Value) {
  const T VWidth = VECWIDTH;
  const T ICount = INTCOUNT;
  const T UCount = UNROLLCOUNT;
#pragma clang loop vectorize_width(VWidth) interleave_count(ICount)
#pragma clang loop unroll_count(UCount)
  for (int i = 0; i < Length; i++) {
    // Expect an unconditional branch tagged with loop metadata (LOOP_10).
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_10:.*]]
    List[i] = i * Value;
  }
}

// Verify templates and constant expressions are handled correctly.
// The pragma arguments depend on the non-type template parameters V, I and U.
// The values quoted below are for the instantiation made in template_test,
// which uses V = 2, I = 4, U = 8.
template <typename A, int V, int I, int U>
void for_template_constant_expression_test(A *List, int Length) {
  // Bare template parameters: 2, 4, 8.
#pragma clang loop vectorize_width(V) interleave_count(I) unroll_count(U)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_11:.*]]
    List[i] = i;
  }

  // Template parameters combined with literals and macros: 6, 10, 24.
#pragma clang loop vectorize_width(V * 2 + VECWIDTH) interleave_count(I * 2 + INTCOUNT) unroll_count(U * 2 + UNROLLCOUNT)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_12:.*]]
    List[i] += i;
  }

  // Template parameters scaled by a const local: 8, 16, 32.
  const int Scale = 4;
#pragma clang loop vectorize_width(Scale * V) interleave_count(Scale * I) unroll_count(Scale * U)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_13:.*]]
    List[i] += i;
  }

  // Parenthesized sub-expression inside the argument: (4 * 2) + 2 == 10.
#pragma clang loop vectorize_width((Scale * V) + 2)
  for (int i = 0; i < Length; i++) {
    // CHECK: br label {{.*}}, !llvm.loop ![[LOOP_14:.*]]
    List[i] += i;
  }
}

// The macros are only needed by the tests above.
#undef VECWIDTH
#undef INTCOUNT
#undef UNROLLCOUNT

// Use templates defined above. Test verifies metadata is generated correctly.
// Instantiates the three function templates so that their bodies are emitted
// and the loop directives inside them can be matched.
void template_test(double *List, int Length) {
  double Value = 10;

  for_template_test<double>(List, Length, Value);
  for_template_define_test<double, int>(List, Length, Value);
  for_template_constant_expression_test<double, 2, 4, 8>(List, Length);
}

// vectorize(enable) combined with an explicit vectorize_width(1).
void vec_width_1(int *List, int Length) {
// CHECK-LABEL: @{{.*}}vec_width_1{{.*}}(
// CHECK: br label {{.*}}, !llvm.loop ![[LOOP_15:.*]]

#pragma clang loop vectorize(enable) vectorize_width(1)
  for (int i = 0; i < Length; i++)
    List[i] = i * 2;
}

// vectorize_width(1) on its own, without vectorize(enable).
// NOTE(review): the label pattern below contains "width_1", which is also a
// substring of "vec_width_1", so this label appears to rely on being placed
// after the vec_width_1 label - confirm before reordering these functions.
void width_1(int *List, int Length) {
// CHECK-LABEL: @{{.*}}width_1{{.*}}(
// CHECK: br label {{.*}}, !llvm.loop ![[LOOP_16:.*]]

#pragma clang loop vectorize_width(1)
  for (int i = 0; i < Length; i++)
    List[i] = i * 2;
}

// Expected contents of the loop metadata nodes captured above. A name bound
// with the `[[NAME:.*]]` form is defined at that point; a bare `[[NAME]]`
// refers back to an earlier definition.

// LOOP_1: while_test.
// CHECK: ![[LOOP_1]] = distinct !{![[LOOP_1]], ![[UNROLL_FULL:.*]]}
// CHECK: ![[UNROLL_FULL]] = !{!"llvm.loop.unroll.full"}

// LOOP_2: do_test.
// CHECK: ![[LOOP_2]] = distinct !{![[LOOP_2]], ![[UNROLL_DISABLE:.*]], ![[DISTRIBUTE_DISABLE:.*]], ![[VECTORIZE_ENABLE:.*]], ![[WIDTH_8:.*]], ![[INTERLEAVE_4:.*]]}
// CHECK: ![[UNROLL_DISABLE]] = !{!"llvm.loop.unroll.disable"}
// CHECK: ![[DISTRIBUTE_DISABLE]] = !{!"llvm.loop.distribute.enable", i1 false}
// CHECK: ![[VECTORIZE_ENABLE]] = !{!"llvm.loop.vectorize.enable", i1 true}
// CHECK: ![[WIDTH_8]] = !{!"llvm.loop.vectorize.width", i32 8}
// CHECK: ![[INTERLEAVE_4]] = !{!"llvm.loop.interleave.count", i32 4}

// LOOP_3: for_test. The unroll count is expected on a separate follow-up node
// referenced through "llvm.loop.vectorize.followup_all".
// CHECK: ![[LOOP_3]] = distinct !{![[LOOP_3]], ![[INTERLEAVE_4:.*]], ![[VECTORIZE_ENABLE]], ![[FOLLOWUP_VECTOR_3:.*]]}
// CHECK: ![[FOLLOWUP_VECTOR_3]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_3:.*]]}
// CHECK: ![[AFTER_VECTOR_3]] = distinct !{![[AFTER_VECTOR_3]], ![[ISVECTORIZED:.*]], ![[UNROLL_8:.*]]}
// CHECK: ![[ISVECTORIZED]] = !{!"llvm.loop.isvectorized"}
// CHECK: ![[UNROLL_8]] = !{!"llvm.loop.unroll.count", i32 8}

// LOOP_4: for_range_test.
// CHECK: ![[LOOP_4]] = distinct !{![[LOOP_4]], ![[VECTORIZE_ENABLE]], ![[WIDTH_2:.*]], ![[INTERLEAVE_2:.*]]}
// CHECK: ![[WIDTH_2]] = !{!"llvm.loop.vectorize.width", i32 2}
// CHECK: ![[INTERLEAVE_2]] = !{!"llvm.loop.interleave.count", i32 2}

// LOOP_5: disable_test. vectorize(disable) is expected to appear as a
// vectorize width of 1.
// CHECK: ![[LOOP_5]] = distinct !{![[LOOP_5]], ![[UNROLL_DISABLE:.*]], ![[DISTRIBUTE_DISABLE:.*]], ![[WIDTH_1:.*]]}
// CHECK: ![[WIDTH_1]] = !{!"llvm.loop.vectorize.width", i32 1}

// LOOP_6: for_define_test.
// CHECK: ![[LOOP_6]] = distinct !{![[LOOP_6]], ![[WIDTH_2:.*]], ![[INTERLEAVE_2:.*]], ![[FOLLOWUP_VECTOR_6:.*]]}
// CHECK: ![[FOLLOWUP_VECTOR_6]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_6:.*]]}
// CHECK: ![[AFTER_VECTOR_6]] = distinct !{![[AFTER_VECTOR_6]], ![[ISVECTORIZED:.*]], ![[UNROLL_8:.*]]}

// LOOP_7 and LOOP_8: for_contant_expression_test (both widths evaluate to 5).
// CHECK: ![[LOOP_7]] = distinct !{![[LOOP_7]], ![[VECTORIZE_ENABLE]], ![[WIDTH_5:.*]]}
// CHECK: ![[WIDTH_5]] = !{!"llvm.loop.vectorize.width", i32 5}

// CHECK: ![[LOOP_8]] = distinct !{![[LOOP_8]], ![[WIDTH_5:.*]]}

// LOOP_9: for_template_test.
// CHECK: ![[LOOP_9]] = distinct !{![[LOOP_9]], ![[WIDTH_8:.*]], ![[INTERLEAVE_8:.*]], ![[FOLLOWUP_VECTOR_9:.*]]}
// CHECK: ![[FOLLOWUP_VECTOR_9]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_9:.*]]}
// CHECK: ![[AFTER_VECTOR_9]] = distinct !{![[AFTER_VECTOR_9]], ![[ISVECTORIZED:.*]], ![[UNROLL_8:.*]]}

// LOOP_10: for_template_define_test.
// CHECK: ![[LOOP_10]] = distinct !{![[LOOP_10]], ![[WIDTH_2:.*]], ![[INTERLEAVE_2:.*]], ![[FOLLOWUP_VECTOR_10:.*]]}
// CHECK: ![[FOLLOWUP_VECTOR_10]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_10:.*]]}
// CHECK: ![[AFTER_VECTOR_10]] = distinct !{![[AFTER_VECTOR_10]], ![[ISVECTORIZED:.*]], ![[UNROLL_8:.*]]}

// LOOP_11: first loop of for_template_constant_expression_test.
// CHECK: ![[LOOP_11]] = distinct !{![[LOOP_11]], ![[WIDTH_2:.*]], ![[INTERLEAVE_4:.*]], ![[FOLLOWUP_VECTOR_11:.*]]}
// CHECK: ![[FOLLOWUP_VECTOR_11]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_11:.*]]}
// CHECK: ![[AFTER_VECTOR_11]] = distinct !{![[AFTER_VECTOR_11]], ![[ISVECTORIZED:.*]], ![[UNROLL_8:.*]]}
// LOOP_12: second loop of for_template_constant_expression_test
// (expected width 6, interleave count 10, unroll count 24).
// CHECK: ![[LOOP_12]] = distinct !{![[LOOP_12]], ![[WIDTH_6:.*]], ![[INTERLEAVE_10:.*]], ![[FOLLOWUP_VECTOR_12:.*]]}
// CHECK: ![[FOLLOWUP_VECTOR_12]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_12:.*]]}
// CHECK: ![[AFTER_VECTOR_12]] = distinct !{![[AFTER_VECTOR_12]], ![[ISVECTORIZED:.*]], ![[UNROLL_24:.*]]}
// CHECK: ![[UNROLL_24]] = !{!"llvm.loop.unroll.count", i32 24}

// LOOP_13: third loop of for_template_constant_expression_test
// (expected width 8, interleave count 16, unroll count 32).
// CHECK: ![[LOOP_13]] = distinct !{![[LOOP_13]], ![[WIDTH_8:.*]], ![[INTERLEAVE_16:.*]], ![[FOLLOWUP_VECTOR_13:.*]]}
// CHECK: ![[INTERLEAVE_16]] = !{!"llvm.loop.interleave.count", i32 16}
// CHECK: ![[FOLLOWUP_VECTOR_13]] = !{!"llvm.loop.vectorize.followup_all", ![[AFTER_VECTOR_13:.*]]}
// CHECK: ![[AFTER_VECTOR_13]] = distinct !{![[AFTER_VECTOR_13]], ![[ISVECTORIZED:.*]], ![[UNROLL_32:.*]]}
// CHECK: ![[UNROLL_32]] = !{!"llvm.loop.unroll.count", i32 32}

// LOOP_14: fourth loop of for_template_constant_expression_test
// (expected width 10).
// CHECK: ![[LOOP_14]] = distinct !{![[LOOP_14]], ![[VECTORIZE_ENABLE]], ![[WIDTH_10:.*]]}
// CHECK: ![[WIDTH_10]] = !{!"llvm.loop.vectorize.width", i32 10}

// LOOP_15: vec_width_1. The width of 1 is expected before the vectorize-enable
// operand.
// CHECK: ![[LOOP_15]] = distinct !{![[LOOP_15]], ![[WIDTH_1]], ![[VECTORIZE_ENABLE]]}

// LOOP_16: width_1. The operands are expected in the opposite order, and the
// node must be on the line directly after LOOP_15's in the output.
// CHECK-NEXT: ![[LOOP_16]] = distinct !{![[LOOP_16]], ![[VECTORIZE_ENABLE]], ![[WIDTH_1]]}