forked from OSchip/llvm-project
65 lines
1.6 KiB
C
65 lines
1.6 KiB
C
// RUN: %clang_cc1 -triple i386-apple-darwin9 -O1 -target-cpu pentium4 -target-feature +sse4.1 -g -emit-llvm %s -o - | FileCheck %s
|
|
typedef short __v4hi __attribute__ ((__vector_size__ (8)));
|
|
|
|
void test1() {
|
|
__v4hi A = (__v4hi)0LL;
|
|
}
|
|
|
|
__v4hi x = {1,2,3};
|
|
__v4hi y = {1,2,3,4};
|
|
|
|
typedef int vty __attribute((vector_size(16)));
|
|
int test2() { vty b; return b[2LL]; }
|
|
|
|
// PR4339
|
|
typedef float vec4 __attribute__((vector_size(16)));
|
|
|
|
void test3 ( vec4* a, char b, float c ) {
|
|
(*a)[b] = c;
|
|
}
|
|
|
|
|
|
|
|
// Don't include mm_malloc.h, it's system specific.
|
|
#define __MM_MALLOC_H
|
|
|
|
#include <mmintrin.h>
|
|
|
|
int test4(int argc, char *argv[]) {
|
|
int array[16] = { 0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15 };
|
|
__m64 *p = (__m64 *)array;
|
|
|
|
__m64 accum = _mm_setzero_si64();
|
|
|
|
for (int i=0; i<8; ++i)
|
|
accum = _mm_add_pi32(p[i], accum);
|
|
|
|
__m64 accum2 = _mm_unpackhi_pi32(accum, accum);
|
|
accum = _mm_add_pi32(accum, accum2);
|
|
|
|
int result = _mm_cvtsi64_si32(accum);
|
|
_mm_empty();
|
|
|
|
return result;
|
|
}
|
|
|
|
#include <smmintrin.h>
|
|
|
|
unsigned long test_epi8(__m128i x) { return _mm_extract_epi8(x, 4); }
|
|
// CHECK: @test_epi8
|
|
// CHECK: extractelement <16 x i8> {{.*}}, i32 4
|
|
// CHECK: zext i8 {{.*}} to i32
|
|
|
|
unsigned long test_epi16(__m128i x) { return _mm_extract_epi16(x, 3); }
|
|
|
|
// CHECK: @test_epi16
|
|
// CHECK: extractelement <8 x i16> {{.*}}, i32 3
|
|
// CHECK: zext i16 {{.*}} to i32
|
|
|
|
void extractinttypes() {
|
|
extern int check_extract_result_int;
|
|
extern __typeof(_mm_extract_epi8(_mm_setzero_si128(), 3)) check_result_int;
|
|
extern __typeof(_mm_extract_epi16(_mm_setzero_si128(), 3)) check_result_int;
|
|
extern __typeof(_mm_extract_epi32(_mm_setzero_si128(), 3)) check_result_int;
|
|
}
|