Chris Lattner | d6b84b9 | 2010-08-20 16:08:33 +0000 | [diff] [blame] | 1 | // RUN: %clang_cc1 -triple i386-apple-darwin9 -O1 -target-cpu pentium4 -target-feature +sse4.1 -g -emit-llvm %s -o - | FileCheck %s |
Anders Carlsson | 79b67f3 | 2008-02-01 23:17:55 +0000 | [diff] [blame] | 2 | typedef short __v4hi __attribute__ ((__vector_size__ (8))); |
| 3 | |
Chris Lattner | d077288 | 2009-10-17 20:37:18 +0000 | [diff] [blame] | 4 | void test1() { |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 5 | __v4hi A = (__v4hi)0LL; |
Anders Carlsson | 2cec15f | 2008-02-01 23:27:51 +0000 | [diff] [blame] | 6 | } |
Eli Friedman | cfb313b | 2008-05-30 12:02:14 +0000 | [diff] [blame] | 7 | |
| 8 | __v4hi x = {1,2,3}; |
| 9 | __v4hi y = {1,2,3,4}; |
Eli Friedman | daa24a2 | 2009-03-28 02:45:41 +0000 | [diff] [blame] | 10 | |
Eli Friedman | 3ded200 | 2009-03-28 03:14:28 +0000 | [diff] [blame] | 11 | typedef int vty __attribute((vector_size(16))); |
Chris Lattner | d077288 | 2009-10-17 20:37:18 +0000 | [diff] [blame] | 12 | int test2() { vty b; return b[2LL]; } |
Eli Friedman | 61d004a | 2009-06-06 19:09:26 +0000 | [diff] [blame] | 13 | |
| 14 | // PR4339 |
| 15 | typedef float vec4 __attribute__((vector_size(16))); |
| 16 | |
Chris Lattner | d077288 | 2009-10-17 20:37:18 +0000 | [diff] [blame] | 17 | void test3 ( vec4* a, char b, float c ) { |
Mike Stump | 1eb4433 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 18 | (*a)[b] = c; |
Eli Friedman | 61d004a | 2009-06-06 19:09:26 +0000 | [diff] [blame] | 19 | } |
Chris Lattner | d077288 | 2009-10-17 20:37:18 +0000 | [diff] [blame] | 20 | |
Bill Wendling | 80d56a9 | 2010-10-20 00:12:59 +0000 | [diff] [blame] | 21 | |
| 22 | |
| 23 | // Don't include mm_malloc.h, it's system specific. |
| 24 | #define __MM_MALLOC_H |
| 25 | |
Chris Lattner | d077288 | 2009-10-17 20:37:18 +0000 | [diff] [blame] | 26 | #include <mmintrin.h> |
| 27 | |
| 28 | int test4(int argc, char *argv[]) { |
| 29 | int array[16] = { 0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15 }; |
| 30 | __m64 *p = (__m64 *)array; |
| 31 | |
| 32 | __m64 accum = _mm_setzero_si64(); |
| 33 | |
| 34 | for (int i=0; i<8; ++i) |
| 35 | accum = _mm_add_pi32(p[i], accum); |
| 36 | |
| 37 | __m64 accum2 = _mm_unpackhi_pi32(accum, accum); |
| 38 | accum = _mm_add_pi32(accum, accum2); |
| 39 | |
| 40 | int result = _mm_cvtsi64_si32(accum); |
| 41 | _mm_empty(); |
| 42 | |
| 43 | return result; |
| 44 | } |
Chris Lattner | d6b84b9 | 2010-08-20 16:08:33 +0000 | [diff] [blame] | 45 | |
| 46 | #include <smmintrin.h> |
| 47 | |
| 48 | unsigned long test_epi8(__m128i x) { return _mm_extract_epi8(x, 4); } |
| 49 | // CHECK: @test_epi8 |
| 50 | // CHECK: extractelement <16 x i8> {{.*}}, i32 4 |
| 51 | // CHECK: zext i8 {{.*}} to i32 |
| 52 | |
| 53 | unsigned long test_epi16(__m128i x) { return _mm_extract_epi16(x, 3); } |
| 54 | |
| 55 | // CHECK: @test_epi16 |
| 56 | // CHECK: extractelement <8 x i16> {{.*}}, i32 3 |
| 57 | // CHECK: zext i16 {{.*}} to i32 |