| // RUN: %clang_cc1 -ffreestanding %s -triple=x86_64-apple-darwin -target-feature +bmi -emit-llvm -o - -Wall -Werror | FileCheck %s |
| |
| |
| #include <immintrin.h> |
| |
| // NOTE: This should match the tests in llvm/test/CodeGen/X86/bmi-intrinsics-fast-isel.ll |
| |
| // The double underscore intrinsics are for compatibility with |
| // AMD's BMI interface. The single underscore intrinsics |
| // are for compatibility with Intel's BMI interface. |
| // Apart from the underscores, the interfaces are identical |
| // except in one case: although the 'bextr' register-form |
| // instruction is identical in hardware, the AMD and Intel |
| // intrinsics are different! |
| |
| unsigned short test__tzcnt_u16(unsigned short __X) { |
| // CHECK-LABEL: test__tzcnt_u16 |
| // CHECK: zext i16 %{{.*}} to i32 |
| // CHECK: icmp ne i32 %{{.*}}, 0 |
| // CHECK: i16 @llvm.cttz.i16(i16 %{{.*}}, i1 true) |
| return __tzcnt_u16(__X); |
| } |
| |
| unsigned int test__andn_u32(unsigned int __X, unsigned int __Y) { |
| // CHECK-LABEL: test__andn_u32 |
| // CHECK: xor i32 %{{.*}}, -1 |
| // CHECK: and i32 %{{.*}}, %{{.*}} |
| return __andn_u32(__X, __Y); |
| } |
| |
| unsigned int test__bextr_u32(unsigned int __X, unsigned int __Y) { |
| // CHECK-LABEL: test__bextr_u32 |
| // CHECK: i32 @llvm.x86.bmi.bextr.32(i32 %{{.*}}, i32 %{{.*}}) |
| return __bextr_u32(__X, __Y); |
| } |
| |
| unsigned int test__blsi_u32(unsigned int __X) { |
| // CHECK-LABEL: test__blsi_u32 |
| // CHECK: sub i32 0, %{{.*}} |
| // CHECK: and i32 %{{.*}}, %{{.*}} |
| return __blsi_u32(__X); |
| } |
| |
| unsigned int test__blsmsk_u32(unsigned int __X) { |
| // CHECK-LABEL: test__blsmsk_u32 |
| // CHECK: sub i32 %{{.*}}, 1 |
| // CHECK: xor i32 %{{.*}}, %{{.*}} |
| return __blsmsk_u32(__X); |
| } |
| |
| unsigned int test__blsr_u32(unsigned int __X) { |
| // CHECK-LABEL: test__blsr_u32 |
| // CHECK: sub i32 %{{.*}}, 1 |
| // CHECK: and i32 %{{.*}}, %{{.*}} |
| return __blsr_u32(__X); |
| } |
| |
| unsigned int test__tzcnt_u32(unsigned int __X) { |
| // CHECK-LABEL: test__tzcnt_u32 |
| // CHECK: icmp ne i32 %{{.*}}, 0 |
| // CHECK: i32 @llvm.cttz.i32(i32 %{{.*}}, i1 true) |
| return __tzcnt_u32(__X); |
| } |
| |
| int test_mm_tzcnt_32(unsigned int __X) { |
| // CHECK-LABEL: test_mm_tzcnt_32 |
| // CHECK: icmp ne i32 %{{.*}}, 0 |
| // CHECK: i32 @llvm.cttz.i32(i32 %{{.*}}, i1 true) |
| return _mm_tzcnt_32(__X); |
| } |
| |
| unsigned long long test__andn_u64(unsigned long __X, unsigned long __Y) { |
| // CHECK-LABEL: test__andn_u64 |
| // CHECK: xor i64 %{{.*}}, -1 |
| // CHECK: and i64 %{{.*}}, %{{.*}} |
| return __andn_u64(__X, __Y); |
| } |
| |
| unsigned long long test__bextr_u64(unsigned long __X, unsigned long __Y) { |
| // CHECK-LABEL: test__bextr_u64 |
| // CHECK: i64 @llvm.x86.bmi.bextr.64(i64 %{{.*}}, i64 %{{.*}}) |
| return __bextr_u64(__X, __Y); |
| } |
| |
| unsigned long long test__blsi_u64(unsigned long long __X) { |
| // CHECK-LABEL: test__blsi_u64 |
| // CHECK: sub i64 0, %{{.*}} |
| // CHECK: and i64 %{{.*}}, %{{.*}} |
| return __blsi_u64(__X); |
| } |
| |
| unsigned long long test__blsmsk_u64(unsigned long long __X) { |
| // CHECK-LABEL: test__blsmsk_u64 |
| // CHECK: sub i64 %{{.*}}, 1 |
| // CHECK: xor i64 %{{.*}}, %{{.*}} |
| return __blsmsk_u64(__X); |
| } |
| |
| unsigned long long test__blsr_u64(unsigned long long __X) { |
| // CHECK-LABEL: test__blsr_u64 |
| // CHECK: sub i64 %{{.*}}, 1 |
| // CHECK: and i64 %{{.*}}, %{{.*}} |
| return __blsr_u64(__X); |
| } |
| |
| unsigned long long test__tzcnt_u64(unsigned long long __X) { |
| // CHECK-LABEL: test__tzcnt_u64 |
| // CHECK: icmp ne i64 %{{.*}}, 0 |
| // CHECK: i64 @llvm.cttz.i64(i64 %{{.*}}, i1 true) |
| return __tzcnt_u64(__X); |
| } |
| |
| long long test_mm_tzcnt_64(unsigned long long __X) { |
| // CHECK-LABEL: test_mm_tzcnt_64 |
| // CHECK: icmp ne i64 %{{.*}}, 0 |
| // CHECK: i64 @llvm.cttz.i64(i64 %{{.*}}, i1 true) |
| return _mm_tzcnt_64(__X); |
| } |
| |
| // Intel intrinsics |
| |
| unsigned short test_tzcnt_u16(unsigned short __X) { |
| // CHECK-LABEL: test_tzcnt_u16 |
| // CHECK: zext i16 %{{.*}} to i32 |
| // CHECK: icmp ne i32 %{{.*}}, 0 |
| // CHECK: i16 @llvm.cttz.i16(i16 %{{.*}}, i1 true) |
| return _tzcnt_u16(__X); |
| } |
| |
| unsigned int test_andn_u32(unsigned int __X, unsigned int __Y) { |
| // CHECK-LABEL: test_andn_u32 |
| // CHECK: xor i32 %{{.*}}, -1 |
| // CHECK: and i32 %{{.*}}, %{{.*}} |
| return _andn_u32(__X, __Y); |
| } |
| |
| unsigned int test_bextr_u32(unsigned int __X, unsigned int __Y, |
| unsigned int __Z) { |
| // CHECK-LABEL: test_bextr_u32 |
| // CHECK: and i32 %{{.*}}, 255 |
| // CHECK: and i32 %{{.*}}, 255 |
| // CHECK: shl i32 %{{.*}}, 8 |
| // CHECK: or i32 %{{.*}}, %{{.*}} |
| // CHECK: i32 @llvm.x86.bmi.bextr.32(i32 %{{.*}}, i32 %{{.*}}) |
| return _bextr_u32(__X, __Y, __Z); |
| } |
| |
| unsigned int test_blsi_u32(unsigned int __X) { |
| // CHECK-LABEL: test_blsi_u32 |
| // CHECK: sub i32 0, %{{.*}} |
| // CHECK: and i32 %{{.*}}, %{{.*}} |
| return _blsi_u32(__X); |
| } |
| |
| unsigned int test_blsmsk_u32(unsigned int __X) { |
| // CHECK-LABEL: test_blsmsk_u32 |
| // CHECK: sub i32 %{{.*}}, 1 |
| // CHECK: xor i32 %{{.*}}, %{{.*}} |
| return _blsmsk_u32(__X); |
| } |
| |
| unsigned int test_blsr_u32(unsigned int __X) { |
| // CHECK-LABEL: test_blsr_u32 |
| // CHECK: sub i32 %{{.*}}, 1 |
| // CHECK: and i32 %{{.*}}, %{{.*}} |
| return _blsr_u32(__X); |
| } |
| |
| unsigned int test_tzcnt_u32(unsigned int __X) { |
| // CHECK-LABEL: test_tzcnt_u32 |
| // CHECK: icmp ne i32 %{{.*}}, 0 |
| // CHECK: i32 @llvm.cttz.i32(i32 %{{.*}}, i1 true) |
| return _tzcnt_u32(__X); |
| } |
| |
| unsigned long long test_andn_u64(unsigned long __X, unsigned long __Y) { |
| // CHECK-LABEL: test_andn_u64 |
| // CHECK: xor i64 %{{.*}}, -1 |
| // CHECK: and i64 %{{.*}}, %{{.*}} |
| return _andn_u64(__X, __Y); |
| } |
| |
| unsigned long long test_bextr_u64(unsigned long __X, unsigned int __Y, |
| unsigned int __Z) { |
| // CHECK-LABEL: test_bextr_u64 |
| // CHECK: and i32 %{{.*}}, 255 |
| // CHECK: and i32 %{{.*}}, 255 |
| // CHECK: shl i32 %{{.*}}, 8 |
| // CHECK: or i32 %{{.*}}, %{{.*}} |
| // CHECK: zext i32 %{{.*}} to i64 |
| // CHECK: i64 @llvm.x86.bmi.bextr.64(i64 %{{.*}}, i64 %{{.*}}) |
| return _bextr_u64(__X, __Y, __Z); |
| } |
| |
| unsigned long long test_blsi_u64(unsigned long long __X) { |
| // CHECK-LABEL: test_blsi_u64 |
| // CHECK: sub i64 0, %{{.*}} |
| // CHECK: and i64 %{{.*}}, %{{.*}} |
| return _blsi_u64(__X); |
| } |
| |
| unsigned long long test_blsmsk_u64(unsigned long long __X) { |
| // CHECK-LABEL: test_blsmsk_u64 |
| // CHECK: sub i64 %{{.*}}, 1 |
| // CHECK: xor i64 %{{.*}}, %{{.*}} |
| return _blsmsk_u64(__X); |
| } |
| |
| unsigned long long test_blsr_u64(unsigned long long __X) { |
| // CHECK-LABEL: test_blsr_u64 |
| // CHECK: sub i64 %{{.*}}, 1 |
| // CHECK: and i64 %{{.*}}, %{{.*}} |
| return _blsr_u64(__X); |
| } |
| |
| unsigned long long test_tzcnt_u64(unsigned long long __X) { |
| // CHECK-LABEL: test_tzcnt_u64 |
| // CHECK: icmp ne i64 %{{.*}}, 0 |
| // CHECK: i64 @llvm.cttz.i64(i64 %{{.*}}, i1 true) |
| return _tzcnt_u64(__X); |
| } |