// C++ program  |  560 lines  |  15.11 KB

// RUN: %clang_cc1 -triple arm64-apple-ios7.0 -target-feature +neon -ffreestanding -Os -S -o - %s | FileCheck %s
// REQUIRES: aarch64-registered-target

#include <arm_neon.h>

// Expects the vaddw_high_s8 call to appear as saddw2.8h in the emitted assembly.
int16x8_t test_vaddw_high_s8(int16x8_t lhs, int8x16_t rhs) {
  // CHECK: saddw2.8h
  const int16x8_t result = vaddw_high_s8(lhs, rhs);
  return result;
}

// Expects the vaddw_high_s16 call to appear as saddw2.4s in the emitted assembly.
int32x4_t test_vaddw_high_s16(int32x4_t lhs, int16x8_t rhs) {
  // CHECK: saddw2.4s
  const int32x4_t result = vaddw_high_s16(lhs, rhs);
  return result;
}

// Expects the vaddw_high_s32 call to appear as saddw2.2d in the emitted assembly.
int64x2_t test_vaddw_high_s32(int64x2_t lhs, int32x4_t rhs) {
  // CHECK: saddw2.2d
  const int64x2_t result = vaddw_high_s32(lhs, rhs);
  return result;
}

// Expects the vaddw_high_u8 call to appear as uaddw2.8h in the emitted assembly.
uint16x8_t test_vaddw_high_u8(uint16x8_t lhs, uint8x16_t rhs) {
  // CHECK: uaddw2.8h
  const uint16x8_t result = vaddw_high_u8(lhs, rhs);
  return result;
}

// Expects the vaddw_high_u16 call to appear as uaddw2.4s in the emitted assembly.
uint32x4_t test_vaddw_high_u16(uint32x4_t lhs, uint16x8_t rhs) {
  // CHECK: uaddw2.4s
  const uint32x4_t result = vaddw_high_u16(lhs, rhs);
  return result;
}

// Expects the vaddw_high_u32 call to appear as uaddw2.2d in the emitted assembly.
uint64x2_t test_vaddw_high_u32(uint64x2_t lhs, uint32x4_t rhs) {
  // CHECK: uaddw2.2d
  const uint64x2_t result = vaddw_high_u32(lhs, rhs);
  return result;
}

// Expects the vsubw_high_s8 call to appear as ssubw2.8h in the emitted assembly.
int16x8_t test_vsubw_high_s8(int16x8_t lhs, int8x16_t rhs) {
  // CHECK: ssubw2.8h
  const int16x8_t difference = vsubw_high_s8(lhs, rhs);
  return difference;
}

// Expects the vsubw_high_s16 call to appear as ssubw2.4s in the emitted assembly.
int32x4_t test_vsubw_high_s16(int32x4_t lhs, int16x8_t rhs) {
  // CHECK: ssubw2.4s
  const int32x4_t difference = vsubw_high_s16(lhs, rhs);
  return difference;
}

// Expects the vsubw_high_s32 call to appear as ssubw2.2d in the emitted assembly.
int64x2_t test_vsubw_high_s32(int64x2_t lhs, int32x4_t rhs) {
  // CHECK: ssubw2.2d
  const int64x2_t difference = vsubw_high_s32(lhs, rhs);
  return difference;
}

// Expects the vsubw_high_u8 call to appear as usubw2.8h in the emitted assembly.
uint16x8_t test_vsubw_high_u8(uint16x8_t lhs, uint8x16_t rhs) {
  // CHECK: usubw2.8h
  const uint16x8_t difference = vsubw_high_u8(lhs, rhs);
  return difference;
}

// Expects the vsubw_high_u16 call to appear as usubw2.4s in the emitted assembly.
uint32x4_t test_vsubw_high_u16(uint32x4_t lhs, uint16x8_t rhs) {
  // CHECK: usubw2.4s
  const uint32x4_t difference = vsubw_high_u16(lhs, rhs);
  return difference;
}

// Expects the vsubw_high_u32 call to appear as usubw2.2d in the emitted assembly.
uint64x2_t test_vsubw_high_u32(uint64x2_t lhs, uint32x4_t rhs) {
  // CHECK: usubw2.2d
  const uint64x2_t difference = vsubw_high_u32(lhs, rhs);
  return difference;
}

// Expects the vabdl_high_s8 call to appear as sabdl2.8h in the emitted assembly.
int16x8_t test_vabdl_high_s8(int8x16_t lhs, int8x16_t rhs) {
  // CHECK: sabdl2.8h
  const int16x8_t abs_diff = vabdl_high_s8(lhs, rhs);
  return abs_diff;
}

// Expects the vabdl_high_s16 call to appear as sabdl2.4s in the emitted assembly.
int32x4_t test_vabdl_high_s16(int16x8_t lhs, int16x8_t rhs) {
  // CHECK: sabdl2.4s
  const int32x4_t abs_diff = vabdl_high_s16(lhs, rhs);
  return abs_diff;
}

// Expects the vabdl_high_s32 call to appear as sabdl2.2d in the emitted assembly.
int64x2_t test_vabdl_high_s32(int32x4_t lhs, int32x4_t rhs) {
  // CHECK: sabdl2.2d
  const int64x2_t abs_diff = vabdl_high_s32(lhs, rhs);
  return abs_diff;
}

// Expects the vabdl_high_u8 call to appear as uabdl2.8h in the emitted assembly.
uint16x8_t test_vabdl_high_u8(uint8x16_t lhs, uint8x16_t rhs) {
  // CHECK: uabdl2.8h
  const uint16x8_t abs_diff = vabdl_high_u8(lhs, rhs);
  return abs_diff;
}

// Expects the vabdl_high_u16 call to appear as uabdl2.4s in the emitted assembly.
uint32x4_t test_vabdl_high_u16(uint16x8_t lhs, uint16x8_t rhs) {
  // CHECK: uabdl2.4s
  const uint32x4_t abs_diff = vabdl_high_u16(lhs, rhs);
  return abs_diff;
}

// Expects the vabdl_high_u32 call to appear as uabdl2.2d in the emitted assembly.
uint64x2_t test_vabdl_high_u32(uint32x4_t lhs, uint32x4_t rhs) {
  // CHECK: uabdl2.2d
  const uint64x2_t abs_diff = vabdl_high_u32(lhs, rhs);
  return abs_diff;
}

// Expects the vabal_high_s8 call to appear as sabal2.8h in the emitted assembly.
int16x8_t test_vabal_high_s8(int16x8_t accum, int8x16_t lhs, int8x16_t rhs) {
  // CHECK: sabal2.8h
  const int16x8_t updated = vabal_high_s8(accum, lhs, rhs);
  return updated;
}

// Expects the vabal_high_s16 call to appear as sabal2.4s in the emitted assembly.
int32x4_t test_vabal_high_s16(int32x4_t accum, int16x8_t lhs, int16x8_t rhs) {
  // CHECK: sabal2.4s
  const int32x4_t updated = vabal_high_s16(accum, lhs, rhs);
  return updated;
}

// Expects the vabal_high_s32 call to appear as sabal2.2d in the emitted assembly.
int64x2_t test_vabal_high_s32(int64x2_t accum, int32x4_t lhs, int32x4_t rhs) {
  // CHECK: sabal2.2d
  const int64x2_t updated = vabal_high_s32(accum, lhs, rhs);
  return updated;
}

// Expects the vabal_high_u8 call to appear as uabal2.8h in the emitted assembly.
uint16x8_t test_vabal_high_u8(uint16x8_t accum, uint8x16_t lhs, uint8x16_t rhs) {
  // CHECK: uabal2.8h
  const uint16x8_t updated = vabal_high_u8(accum, lhs, rhs);
  return updated;
}

// Expects the vabal_high_u16 call to appear as uabal2.4s in the emitted assembly.
uint32x4_t test_vabal_high_u16(uint32x4_t accum, uint16x8_t lhs, uint16x8_t rhs) {
  // CHECK: uabal2.4s
  const uint32x4_t updated = vabal_high_u16(accum, lhs, rhs);
  return updated;
}

// Expects the vabal_high_u32 call to appear as uabal2.2d in the emitted assembly.
uint64x2_t test_vabal_high_u32(uint64x2_t accum, uint32x4_t lhs, uint32x4_t rhs) {
  // CHECK: uabal2.2d
  const uint64x2_t updated = vabal_high_u32(accum, lhs, rhs);
  return updated;
}

// Expects the vqdmlal_high_s16 call to appear as sqdmlal2.4s in the emitted assembly.
int32x4_t test_vqdmlal_high_s16(int32x4_t accum, int16x8_t lhs, int16x8_t rhs) {
  // CHECK: sqdmlal2.4s
  const int32x4_t updated = vqdmlal_high_s16(accum, lhs, rhs);
  return updated;
}

// Expects the vqdmlal_high_s32 call to appear as sqdmlal2.2d in the emitted assembly.
int64x2_t test_vqdmlal_high_s32(int64x2_t accum, int32x4_t lhs, int32x4_t rhs) {
  // CHECK: sqdmlal2.2d
  const int64x2_t updated = vqdmlal_high_s32(accum, lhs, rhs);
  return updated;
}

// Expects the vqdmlsl_high_s16 call to appear as sqdmlsl2.4s in the emitted assembly.
int32x4_t test_vqdmlsl_high_s16(int32x4_t accum, int16x8_t lhs, int16x8_t rhs) {
  // CHECK: sqdmlsl2.4s
  const int32x4_t updated = vqdmlsl_high_s16(accum, lhs, rhs);
  return updated;
}

// Expects the vqdmlsl_high_s32 call to appear as sqdmlsl2.2d in the emitted assembly.
int64x2_t test_vqdmlsl_high_s32(int64x2_t accum, int32x4_t lhs, int32x4_t rhs) {
  // CHECK: sqdmlsl2.2d
  const int64x2_t updated = vqdmlsl_high_s32(accum, lhs, rhs);
  return updated;
}

// Expects the vqdmull_high_s16 call to appear as sqdmull2.4s in the emitted assembly.
int32x4_t test_vqdmull_high_s16(int16x8_t lhs, int16x8_t rhs) {
  // CHECK: sqdmull2.4s
  const int32x4_t product = vqdmull_high_s16(lhs, rhs);
  return product;
}

// Expects the vqdmull_high_s32 call to appear as sqdmull2.2d in the emitted assembly.
int64x2_t test_vqdmull_high_s32(int32x4_t lhs, int32x4_t rhs) {
  // CHECK: sqdmull2.2d
  const int64x2_t product = vqdmull_high_s32(lhs, rhs);
  return product;
}

// Expects vshll_high_n_s8 with a shift count of 7 to appear as sshll2.8h in the
// emitted assembly.
int16x8_t test_vshll_high_n_s8(int8x16_t in) {
  // CHECK: sshll2.8h
  const int16x8_t widened = vshll_high_n_s8(in, 7);
  return widened;
}

// Expects vshll_high_n_s16 with a shift count of 15 to appear as sshll2.4s in
// the emitted assembly.
int32x4_t test_vshll_high_n_s16(int16x8_t in) {
  // CHECK: sshll2.4s
  const int32x4_t widened = vshll_high_n_s16(in, 15);
  return widened;
}

// Expects vshll_high_n_s32 with a shift count of 31 to appear as sshll2.2d in
// the emitted assembly.
int64x2_t test_vshll_high_n_s32(int32x4_t in) {
  // CHECK: sshll2.2d
  const int64x2_t widened = vshll_high_n_s32(in, 31);
  return widened;
}

// Expects vshll_high_n_u8 with a shift count of 7 to appear as ushll2.8h in the
// emitted assembly. The signature uses signed vector types while the intrinsic
// is the unsigned variant, so the conversions are spelled out with
// vreinterpretq_* instead of relying on implicit lax vector conversions.
int16x8_t test_vshll_high_n_u8(int8x16_t in) {
  // CHECK: ushll2.8h
  const uint16x8_t widened = vshll_high_n_u8(vreinterpretq_u8_s8(in), 7);
  return vreinterpretq_s16_u16(widened);
}

// Expects vshll_high_n_u16 with a shift count of 15 to appear as ushll2.4s in
// the emitted assembly. The signature uses signed vector types while the
// intrinsic is the unsigned variant, so the conversions are spelled out with
// vreinterpretq_* instead of relying on implicit lax vector conversions.
int32x4_t test_vshll_high_n_u16(int16x8_t in) {
  // CHECK: ushll2.4s
  const uint32x4_t widened = vshll_high_n_u16(vreinterpretq_u16_s16(in), 15);
  return vreinterpretq_s32_u32(widened);
}

// Expects vshll_high_n_u32 with a shift count of 31 to appear as ushll2.2d in
// the emitted assembly. The signature uses signed vector types while the
// intrinsic is the unsigned variant, so the conversions are spelled out with
// vreinterpretq_* instead of relying on implicit lax vector conversions.
int64x2_t test_vshll_high_n_u32(int32x4_t in) {
  // CHECK: ushll2.2d
  const uint64x2_t widened = vshll_high_n_u32(vreinterpretq_u32_s32(in), 31);
  return vreinterpretq_s64_u64(widened);
}

// Expects vshll_high_n_s8 with a shift count of 8 to appear as shll2.8h in the
// emitted assembly.
int16x8_t test_vshll_high_n_s8_max(int8x16_t in) {
  // CHECK: shll2.8h
  const int16x8_t widened = vshll_high_n_s8(in, 8);
  return widened;
}

// Expects vshll_high_n_s16 with a shift count of 16 to appear as shll2.4s in
// the emitted assembly.
int32x4_t test_vshll_high_n_s16_max(int16x8_t in) {
  // CHECK: shll2.4s
  const int32x4_t widened = vshll_high_n_s16(in, 16);
  return widened;
}

// Expects vshll_high_n_s32 with a shift count of 32 to appear as shll2.2d in
// the emitted assembly.
int64x2_t test_vshll_high_n_s32_max(int32x4_t in) {
  // CHECK: shll2.2d
  const int64x2_t widened = vshll_high_n_s32(in, 32);
  return widened;
}

// Expects vshll_high_n_u8 with a shift count of 8 to appear as shll2.8h in the
// emitted assembly. The signature uses signed vector types while the intrinsic
// is the unsigned variant, so the conversions are spelled out with
// vreinterpretq_* instead of relying on implicit lax vector conversions.
int16x8_t test_vshll_high_n_u8_max(int8x16_t in) {
  // CHECK: shll2.8h
  const uint16x8_t widened = vshll_high_n_u8(vreinterpretq_u8_s8(in), 8);
  return vreinterpretq_s16_u16(widened);
}

// Expects vshll_high_n_u16 with a shift count of 16 to appear as shll2.4s in
// the emitted assembly. The signature uses signed vector types while the
// intrinsic is the unsigned variant, so the conversions are spelled out with
// vreinterpretq_* instead of relying on implicit lax vector conversions.
int32x4_t test_vshll_high_n_u16_max(int16x8_t in) {
  // CHECK: shll2.4s
  const uint32x4_t widened = vshll_high_n_u16(vreinterpretq_u16_s16(in), 16);
  return vreinterpretq_s32_u32(widened);
}

// Expects vshll_high_n_u32 with a shift count of 32 to appear as shll2.2d in
// the emitted assembly. The signature uses signed vector types while the
// intrinsic is the unsigned variant, so the conversions are spelled out with
// vreinterpretq_* instead of relying on implicit lax vector conversions.
int64x2_t test_vshll_high_n_u32_max(int32x4_t in) {
  // CHECK: shll2.2d
  const uint64x2_t widened = vshll_high_n_u32(vreinterpretq_u32_s32(in), 32);
  return vreinterpretq_s64_u64(widened);
}

// Expects the vsubl_high_s8 call to appear as ssubl2.8h in the emitted assembly.
int16x8_t test_vsubl_high_s8(int8x16_t lhs, int8x16_t rhs) {
  // CHECK: ssubl2.8h
  const int16x8_t difference = vsubl_high_s8(lhs, rhs);
  return difference;
}

// Expects the vsubl_high_s16 call to appear as ssubl2.4s in the emitted assembly.
int32x4_t test_vsubl_high_s16(int16x8_t lhs, int16x8_t rhs) {
  // CHECK: ssubl2.4s
  const int32x4_t difference = vsubl_high_s16(lhs, rhs);
  return difference;
}

// Expects the vsubl_high_s32 call to appear as ssubl2.2d in the emitted assembly.
int64x2_t test_vsubl_high_s32(int32x4_t lhs, int32x4_t rhs) {
  // CHECK: ssubl2.2d
  const int64x2_t difference = vsubl_high_s32(lhs, rhs);
  return difference;
}

// Expects the vsubl_high_u8 call to appear as usubl2.8h in the emitted assembly.
uint16x8_t test_vsubl_high_u8(uint8x16_t lhs, uint8x16_t rhs) {
  // CHECK: usubl2.8h
  const uint16x8_t difference = vsubl_high_u8(lhs, rhs);
  return difference;
}

// Expects the vsubl_high_u16 call to appear as usubl2.4s in the emitted assembly.
uint32x4_t test_vsubl_high_u16(uint16x8_t lhs, uint16x8_t rhs) {
  // CHECK: usubl2.4s
  const uint32x4_t difference = vsubl_high_u16(lhs, rhs);
  return difference;
}

// Expects the vsubl_high_u32 call to appear as usubl2.2d in the emitted assembly.
uint64x2_t test_vsubl_high_u32(uint32x4_t lhs, uint32x4_t rhs) {
  // CHECK: usubl2.2d
  const uint64x2_t difference = vsubl_high_u32(lhs, rhs);
  return difference;
}

// Expects vrshrn_high_n_s16 with a shift count of 2 to appear as rshrn2.16b in
// the emitted assembly.
int8x16_t test_vrshrn_high_n_s16(int8x8_t lowpart, int16x8_t input) {
  // CHECK: rshrn2.16b
  const int8x16_t narrowed = vrshrn_high_n_s16(lowpart, input, 2);
  return narrowed;
}

// Expects vrshrn_high_n_s32 with a shift count of 2 to appear as rshrn2.8h in
// the emitted assembly.
int16x8_t test_vrshrn_high_n_s32(int16x4_t lowpart, int32x4_t input) {
  // CHECK: rshrn2.8h
  const int16x8_t narrowed = vrshrn_high_n_s32(lowpart, input, 2);
  return narrowed;
}

// Expects vrshrn_high_n_s64 with a shift count of 2 to appear as rshrn2.4s in
// the emitted assembly. The expected mnemonic includes the leading "r" so that
// a plain shrn2.4s cannot satisfy the match by substring, in line with the
// other vrshrn_high_n tests in this file.
int32x4_t test_vrshrn_high_n_s64(int32x2_t lowpart, int64x2_t input) {
  // CHECK: rshrn2.4s
  return vrshrn_high_n_s64(lowpart, input, 2);
}

// Expects vrshrn_high_n_u16 with a shift count of 2 to appear as rshrn2.16b in
// the emitted assembly.
uint8x16_t test_vrshrn_high_n_u16(uint8x8_t lowpart, uint16x8_t input) {
  // CHECK: rshrn2.16b
  const uint8x16_t narrowed = vrshrn_high_n_u16(lowpart, input, 2);
  return narrowed;
}

// Expects vrshrn_high_n_u32 with a shift count of 2 to appear as rshrn2.8h in
// the emitted assembly.
uint16x8_t test_vrshrn_high_n_u32(uint16x4_t lowpart, uint32x4_t input) {
  // CHECK: rshrn2.8h
  const uint16x8_t narrowed = vrshrn_high_n_u32(lowpart, input, 2);
  return narrowed;
}

// Expects vrshrn_high_n_u64 with a shift count of 2 to appear as rshrn2.4s in
// the emitted assembly.
uint32x4_t test_vrshrn_high_n_u64(uint32x2_t lowpart, uint64x2_t input) {
  // CHECK: rshrn2.4s
  const uint32x4_t narrowed = vrshrn_high_n_u64(lowpart, input, 2);
  return narrowed;
}

// Expects vshrn_high_n_s16 with a shift count of 2 to appear as shrn2.16b in
// the emitted assembly.
int8x16_t test_vshrn_high_n_s16(int8x8_t lowpart, int16x8_t input) {
  // CHECK: shrn2.16b
  const int8x16_t narrowed = vshrn_high_n_s16(lowpart, input, 2);
  return narrowed;
}

// Expects vshrn_high_n_s32 with a shift count of 2 to appear as shrn2.8h in
// the emitted assembly.
int16x8_t test_vshrn_high_n_s32(int16x4_t lowpart, int32x4_t input) {
  // CHECK: shrn2.8h
  const int16x8_t narrowed = vshrn_high_n_s32(lowpart, input, 2);
  return narrowed;
}

// Expects vshrn_high_n_s64 with a shift count of 2 to appear as shrn2.4s in
// the emitted assembly.
int32x4_t test_vshrn_high_n_s64(int32x2_t lowpart, int64x2_t input) {
  // CHECK: shrn2.4s
  const int32x4_t narrowed = vshrn_high_n_s64(lowpart, input, 2);
  return narrowed;
}

// Expects vshrn_high_n_u16 with a shift count of 2 to appear as shrn2.16b in
// the emitted assembly.
uint8x16_t test_vshrn_high_n_u16(uint8x8_t lowpart, uint16x8_t input) {
  // CHECK: shrn2.16b
  const uint8x16_t narrowed = vshrn_high_n_u16(lowpart, input, 2);
  return narrowed;
}

// Expects vshrn_high_n_u32 with a shift count of 2 to appear as shrn2.8h in
// the emitted assembly.
uint16x8_t test_vshrn_high_n_u32(uint16x4_t lowpart, uint32x4_t input) {
  // CHECK: shrn2.8h
  const uint16x8_t narrowed = vshrn_high_n_u32(lowpart, input, 2);
  return narrowed;
}

// Expects vshrn_high_n_u64 with a shift count of 2 to appear as shrn2.4s in
// the emitted assembly.
uint32x4_t test_vshrn_high_n_u64(uint32x2_t lowpart, uint64x2_t input) {
  // CHECK: shrn2.4s
  const uint32x4_t narrowed = vshrn_high_n_u64(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrun_high_n_s16 with a shift count of 2 to appear as sqshrun2.16b
// in the emitted assembly.
uint8x16_t test_vqshrun_high_n_s16(uint8x8_t lowpart, int16x8_t input) {
  // CHECK: sqshrun2.16b
  const uint8x16_t narrowed = vqshrun_high_n_s16(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrun_high_n_s32 with a shift count of 2 to appear as sqshrun2.8h
// in the emitted assembly.
uint16x8_t test_vqshrun_high_n_s32(uint16x4_t lowpart, int32x4_t input) {
  // CHECK: sqshrun2.8h
  const uint16x8_t narrowed = vqshrun_high_n_s32(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrun_high_n_s64 with a shift count of 2 to appear as sqshrun2.4s
// in the emitted assembly.
uint32x4_t test_vqshrun_high_n_s64(uint32x2_t lowpart, int64x2_t input) {
  // CHECK: sqshrun2.4s
  const uint32x4_t narrowed = vqshrun_high_n_s64(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrun_high_n_s16 with a shift count of 2 to appear as
// sqrshrun2.16b in the emitted assembly.
uint8x16_t test_vqrshrun_high_n_s16(uint8x8_t lowpart, int16x8_t input) {
  // CHECK: sqrshrun2.16b
  const uint8x16_t narrowed = vqrshrun_high_n_s16(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrun_high_n_s32 with a shift count of 2 to appear as
// sqrshrun2.8h in the emitted assembly.
uint16x8_t test_vqrshrun_high_n_s32(uint16x4_t lowpart, int32x4_t input) {
  // CHECK: sqrshrun2.8h
  const uint16x8_t narrowed = vqrshrun_high_n_s32(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrun_high_n_s64 with a shift count of 2 to appear as
// sqrshrun2.4s in the emitted assembly.
uint32x4_t test_vqrshrun_high_n_s64(uint32x2_t lowpart, int64x2_t input) {
  // CHECK: sqrshrun2.4s
  const uint32x4_t narrowed = vqrshrun_high_n_s64(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrn_high_n_s16 with a shift count of 2 to appear as sqshrn2.16b
// in the emitted assembly.
int8x16_t test_vqshrn_high_n_s16(int8x8_t lowpart, int16x8_t input) {
  // CHECK: sqshrn2.16b
  const int8x16_t narrowed = vqshrn_high_n_s16(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrn_high_n_s32 with a shift count of 2 to appear as sqshrn2.8h
// in the emitted assembly.
int16x8_t test_vqshrn_high_n_s32(int16x4_t lowpart, int32x4_t input) {
  // CHECK: sqshrn2.8h
  const int16x8_t narrowed = vqshrn_high_n_s32(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrn_high_n_s64 with a shift count of 2 to appear as sqshrn2.4s
// in the emitted assembly.
int32x4_t test_vqshrn_high_n_s64(int32x2_t lowpart, int64x2_t input) {
  // CHECK: sqshrn2.4s
  const int32x4_t narrowed = vqshrn_high_n_s64(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrn_high_n_u16 with a shift count of 2 to appear as uqshrn2.16b
// in the emitted assembly.
uint8x16_t test_vqshrn_high_n_u16(uint8x8_t lowpart, uint16x8_t input) {
  // CHECK: uqshrn2.16b
  const uint8x16_t narrowed = vqshrn_high_n_u16(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrn_high_n_u32 with a shift count of 2 to appear as uqshrn2.8h
// in the emitted assembly.
uint16x8_t test_vqshrn_high_n_u32(uint16x4_t lowpart, uint32x4_t input) {
  // CHECK: uqshrn2.8h
  const uint16x8_t narrowed = vqshrn_high_n_u32(lowpart, input, 2);
  return narrowed;
}

// Expects vqshrn_high_n_u64 with a shift count of 2 to appear as uqshrn2.4s
// in the emitted assembly.
uint32x4_t test_vqshrn_high_n_u64(uint32x2_t lowpart, uint64x2_t input) {
  // CHECK: uqshrn2.4s
  const uint32x4_t narrowed = vqshrn_high_n_u64(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrn_high_n_s16 with a shift count of 2 to appear as
// sqrshrn2.16b in the emitted assembly.
int8x16_t test_vqrshrn_high_n_s16(int8x8_t lowpart, int16x8_t input) {
  // CHECK: sqrshrn2.16b
  const int8x16_t narrowed = vqrshrn_high_n_s16(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrn_high_n_s32 with a shift count of 2 to appear as sqrshrn2.8h
// in the emitted assembly.
int16x8_t test_vqrshrn_high_n_s32(int16x4_t lowpart, int32x4_t input) {
  // CHECK: sqrshrn2.8h
  const int16x8_t narrowed = vqrshrn_high_n_s32(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrn_high_n_s64 with a shift count of 2 to appear as sqrshrn2.4s
// in the emitted assembly.
int32x4_t test_vqrshrn_high_n_s64(int32x2_t lowpart, int64x2_t input) {
  // CHECK: sqrshrn2.4s
  const int32x4_t narrowed = vqrshrn_high_n_s64(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrn_high_n_u16 with a shift count of 2 to appear as
// uqrshrn2.16b in the emitted assembly.
uint8x16_t test_vqrshrn_high_n_u16(uint8x8_t lowpart, uint16x8_t input) {
  // CHECK: uqrshrn2.16b
  const uint8x16_t narrowed = vqrshrn_high_n_u16(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrn_high_n_u32 with a shift count of 2 to appear as uqrshrn2.8h
// in the emitted assembly.
uint16x8_t test_vqrshrn_high_n_u32(uint16x4_t lowpart, uint32x4_t input) {
  // CHECK: uqrshrn2.8h
  const uint16x8_t narrowed = vqrshrn_high_n_u32(lowpart, input, 2);
  return narrowed;
}

// Expects vqrshrn_high_n_u64 with a shift count of 2 to appear as uqrshrn2.4s
// in the emitted assembly.
uint32x4_t test_vqrshrn_high_n_u64(uint32x2_t lowpart, uint64x2_t input) {
  // CHECK: uqrshrn2.4s
  const uint32x4_t narrowed = vqrshrn_high_n_u64(lowpart, input, 2);
  return narrowed;
}

// Expects the vaddhn_high_s16 call to appear as addhn2.16b writing v0 from v1
// and v2 (either source order is accepted) in the emitted assembly.
int8x16_t test_vaddhn_high_s16(int8x8_t lowpart, int16x8_t lhs, int16x8_t rhs) {
  // CHECK: addhn2.16b v0, {{v1, v2|v2, v1}}
  const int8x16_t combined = vaddhn_high_s16(lowpart, lhs, rhs);
  return combined;
}

// Expects the vaddhn_high_s32 call to appear as addhn2.8h writing v0 from v1
// and v2 (either source order is accepted) in the emitted assembly.
int16x8_t test_vaddhn_high_s32(int16x4_t lowpart, int32x4_t lhs, int32x4_t rhs) {
  // CHECK: addhn2.8h v0, {{v1, v2|v2, v1}}
  const int16x8_t combined = vaddhn_high_s32(lowpart, lhs, rhs);
  return combined;
}

// Expects the vaddhn_high_s64 call to appear as addhn2.4s writing v0 from v1
// and v2 (either source order is accepted) in the emitted assembly.
int32x4_t test_vaddhn_high_s64(int32x2_t lowpart, int64x2_t lhs, int64x2_t rhs) {
  // CHECK: addhn2.4s v0, {{v1, v2|v2, v1}}
  const int32x4_t combined = vaddhn_high_s64(lowpart, lhs, rhs);
  return combined;
}

// Expects the vaddhn_high_u16 call to appear as addhn2.16b writing v0 from v1
// and v2 (either source order is accepted) in the emitted assembly.
// Calls the unsigned intrinsic that the test name and parameter types refer to;
// the signed vaddhn_high_s16 has its own test.
uint8x16_t test_vaddhn_high_u16(uint8x8_t lowpart, uint16x8_t lhs, uint16x8_t rhs) {
  // CHECK: addhn2.16b v0, {{v1, v2|v2, v1}}
  return vaddhn_high_u16(lowpart, lhs, rhs);
}

// Expects the vaddhn_high_u32 call to appear as addhn2.8h writing v0 from v1
// and v2 (either source order is accepted) in the emitted assembly.
// Calls the unsigned intrinsic that the test name and parameter types refer to;
// the signed vaddhn_high_s32 has its own test.
uint16x8_t test_vaddhn_high_u32(uint16x4_t lowpart, uint32x4_t lhs, uint32x4_t rhs) {
  // CHECK: addhn2.8h v0, {{v1, v2|v2, v1}}
  return vaddhn_high_u32(lowpart, lhs, rhs);
}

// Expects the vaddhn_high_u64 call to appear as addhn2.4s writing v0 from v1
// and v2 (either source order is accepted) in the emitted assembly.
// Calls the unsigned intrinsic that the test name and parameter types refer to;
// the signed vaddhn_high_s64 has its own test.
uint32x4_t test_vaddhn_high_u64(uint32x2_t lowpart, uint64x2_t lhs, uint64x2_t rhs) {
  // CHECK: addhn2.4s v0, {{v1, v2|v2, v1}}
  return vaddhn_high_u64(lowpart, lhs, rhs);
}

// Expects the vraddhn_high_s16 call to appear as "raddhn2.16b v0, v1, v2" in
// the emitted assembly.
int8x16_t test_vraddhn_high_s16(int8x8_t lowpart, int16x8_t lhs, int16x8_t rhs) {
  // CHECK: raddhn2.16b v0, v1, v2
  const int8x16_t combined = vraddhn_high_s16(lowpart, lhs, rhs);
  return combined;
}

// Expects the vraddhn_high_s32 call to appear as "raddhn2.8h v0, v1, v2" in
// the emitted assembly.
int16x8_t test_vraddhn_high_s32(int16x4_t lowpart, int32x4_t lhs, int32x4_t rhs) {
  // CHECK: raddhn2.8h v0, v1, v2
  const int16x8_t combined = vraddhn_high_s32(lowpart, lhs, rhs);
  return combined;
}

// Expects the vraddhn_high_s64 call to appear as "raddhn2.4s v0, v1, v2" in
// the emitted assembly.
int32x4_t test_vraddhn_high_s64(int32x2_t lowpart, int64x2_t lhs, int64x2_t rhs) {
  // CHECK: raddhn2.4s v0, v1, v2
  const int32x4_t combined = vraddhn_high_s64(lowpart, lhs, rhs);
  return combined;
}

// Expects the vraddhn_high_u16 call to appear as "raddhn2.16b v0, v1, v2" in
// the emitted assembly.
// Calls the unsigned intrinsic that the test name and parameter types refer to;
// the signed vraddhn_high_s16 has its own test.
uint8x16_t test_vraddhn_high_u16(uint8x8_t lowpart, uint16x8_t lhs, uint16x8_t rhs) {
  // CHECK: raddhn2.16b v0, v1, v2
  return vraddhn_high_u16(lowpart, lhs, rhs);
}

// Expects the vraddhn_high_u32 call to appear as "raddhn2.8h v0, v1, v2" in
// the emitted assembly.
// Calls the unsigned intrinsic that the test name and parameter types refer to;
// the signed vraddhn_high_s32 has its own test.
uint16x8_t test_vraddhn_high_u32(uint16x4_t lowpart, uint32x4_t lhs, uint32x4_t rhs) {
  // CHECK: raddhn2.8h v0, v1, v2
  return vraddhn_high_u32(lowpart, lhs, rhs);
}

// Expects the vraddhn_high_u64 call to appear as "raddhn2.4s v0, v1, v2" in
// the emitted assembly.
// Calls the unsigned intrinsic that the test name and parameter types refer to;
// the signed vraddhn_high_s64 has its own test.
uint32x4_t test_vraddhn_high_u64(uint32x2_t lowpart, uint64x2_t lhs, uint64x2_t rhs) {
  // CHECK: raddhn2.4s v0, v1, v2
  return vraddhn_high_u64(lowpart, lhs, rhs);
}

// Expects the vmovn_high_s16 call to appear as "xtn2.16b v0, v1" in the
// emitted assembly.
int8x16_t test_vmovn_high_s16(int8x8_t lowpart, int16x8_t wide) {
  // CHECK: xtn2.16b v0, v1
  const int8x16_t narrowed = vmovn_high_s16(lowpart, wide);
  return narrowed;
}

// Expects the vmovn_high_s32 call to appear as "xtn2.8h v0, v1" in the
// emitted assembly.
int16x8_t test_vmovn_high_s32(int16x4_t lowpart, int32x4_t wide) {
  // CHECK: xtn2.8h v0, v1
  const int16x8_t narrowed = vmovn_high_s32(lowpart, wide);
  return narrowed;
}

// Expects the vmovn_high_s64 call to appear as "xtn2.4s v0, v1" in the
// emitted assembly.
int32x4_t test_vmovn_high_s64(int32x2_t lowpart, int64x2_t wide) {
  // CHECK: xtn2.4s v0, v1
  const int32x4_t narrowed = vmovn_high_s64(lowpart, wide);
  return narrowed;
}

// Expects the vmovn_high_u16 call to appear as "xtn2.16b v0, v1" in the
// emitted assembly.
uint8x16_t test_vmovn_high_u16(uint8x8_t lowpart, uint16x8_t wide) {
  // CHECK: xtn2.16b v0, v1
  const uint8x16_t narrowed = vmovn_high_u16(lowpart, wide);
  return narrowed;
}

// Expects the vmovn_high_u32 call to appear as "xtn2.8h v0, v1" in the
// emitted assembly.
uint16x8_t test_vmovn_high_u32(uint16x4_t lowpart, uint32x4_t wide) {
  // CHECK: xtn2.8h v0, v1
  const uint16x8_t narrowed = vmovn_high_u32(lowpart, wide);
  return narrowed;
}

// Expects the vmovn_high_u64 call to appear as "xtn2.4s v0, v1" in the
// emitted assembly.
uint32x4_t test_vmovn_high_u64(uint32x2_t lowpart, uint64x2_t wide) {
  // CHECK: xtn2.4s v0, v1
  const uint32x4_t narrowed = vmovn_high_u64(lowpart, wide);
  return narrowed;
}

// Expects the vqmovn_high_s16 call to appear as "sqxtn2.16b v0, v1" in the
// emitted assembly.
int8x16_t test_vqmovn_high_s16(int8x8_t lowpart, int16x8_t wide) {
  // CHECK: sqxtn2.16b v0, v1
  const int8x16_t narrowed = vqmovn_high_s16(lowpart, wide);
  return narrowed;
}

// Expects the vqmovn_high_s32 call to appear as "sqxtn2.8h v0, v1" in the
// emitted assembly.
int16x8_t test_vqmovn_high_s32(int16x4_t lowpart, int32x4_t wide) {
  // CHECK: sqxtn2.8h v0, v1
  const int16x8_t narrowed = vqmovn_high_s32(lowpart, wide);
  return narrowed;
}

// Expects the vqmovn_high_s64 call to appear as "sqxtn2.4s v0, v1" in the
// emitted assembly.
int32x4_t test_vqmovn_high_s64(int32x2_t lowpart, int64x2_t wide) {
  // CHECK: sqxtn2.4s v0, v1
  const int32x4_t narrowed = vqmovn_high_s64(lowpart, wide);
  return narrowed;
}

// Expects the vqmovn_high_u16 call to appear as "uqxtn2.16b v0, v1" in the
// emitted assembly. The `wide` parameter is declared with a signed vector type
// while the intrinsic is the unsigned variant, so the conversion is spelled out
// with vreinterpretq_u16_s16 instead of relying on implicit lax vector
// conversions.
uint8x16_t test_vqmovn_high_u16(uint8x8_t lowpart, int16x8_t wide) {
  // CHECK: uqxtn2.16b v0, v1
  return vqmovn_high_u16(lowpart, vreinterpretq_u16_s16(wide));
}

// Expects the vqmovn_high_u32 call to appear as "uqxtn2.8h v0, v1" in the
// emitted assembly. The `wide` parameter is declared with a signed vector type
// while the intrinsic is the unsigned variant, so the conversion is spelled out
// with vreinterpretq_u32_s32 instead of relying on implicit lax vector
// conversions.
uint16x8_t test_vqmovn_high_u32(uint16x4_t lowpart, int32x4_t wide) {
  // CHECK: uqxtn2.8h v0, v1
  return vqmovn_high_u32(lowpart, vreinterpretq_u32_s32(wide));
}

// Expects the vqmovn_high_u64 call to appear as "uqxtn2.4s v0, v1" in the
// emitted assembly. The `wide` parameter is declared with a signed vector type
// while the intrinsic is the unsigned variant, so the conversion is spelled out
// with vreinterpretq_u64_s64 instead of relying on implicit lax vector
// conversions.
uint32x4_t test_vqmovn_high_u64(uint32x2_t lowpart, int64x2_t wide) {
  // CHECK: uqxtn2.4s v0, v1
  return vqmovn_high_u64(lowpart, vreinterpretq_u64_s64(wide));
}

// Expects the vqmovun_high_s16 call to appear as "sqxtun2.16b v0, v1" in the
// emitted assembly.
uint8x16_t test_vqmovun_high_s16(uint8x8_t lowpart, int16x8_t wide) {
  // CHECK: sqxtun2.16b v0, v1
  const uint8x16_t narrowed = vqmovun_high_s16(lowpart, wide);
  return narrowed;
}

// Expects the vqmovun_high_s32 call to appear as "sqxtun2.8h v0, v1" in the
// emitted assembly.
uint16x8_t test_vqmovun_high_s32(uint16x4_t lowpart, int32x4_t wide) {
  // CHECK: sqxtun2.8h v0, v1
  const uint16x8_t narrowed = vqmovun_high_s32(lowpart, wide);
  return narrowed;
}

// Expects the vqmovun_high_s64 call to appear as "sqxtun2.4s v0, v1" in the
// emitted assembly.
uint32x4_t test_vqmovun_high_s64(uint32x2_t lowpart, int64x2_t wide) {
  // CHECK: sqxtun2.4s v0, v1
  const uint32x4_t narrowed = vqmovun_high_s64(lowpart, wide);
  return narrowed;
}

// Expects the vcvtx_high_f32_f64 call to appear as "fcvtxn2 v0.4s, v1.2d" in
// the emitted assembly.
float32x4_t test_vcvtx_high_f32_f64(float32x2_t lowpart, float64x2_t wide) {
  // CHECK: fcvtxn2 v0.4s, v1.2d
  const float32x4_t converted = vcvtx_high_f32_f64(lowpart, wide);
  return converted;
}

// Expects the vcvt_f64_f32 call to appear as "fcvtl v0.2d, v0.2s" in the
// emitted assembly.
float64x2_t test_vcvt_f64_f32(float32x2_t x) {
  // CHECK: fcvtl v0.2d, v0.2s
  const float64x2_t converted = vcvt_f64_f32(x);
  return converted;
}

// Expects the vcvt_high_f64_f32 call to appear as "fcvtl2 v0.2d, v0.4s" in the
// emitted assembly.
float64x2_t test_vcvt_high_f64_f32(float32x4_t x) {
  // CHECK: fcvtl2 v0.2d, v0.4s
  const float64x2_t converted = vcvt_high_f64_f32(x);
  return converted;
}

// Expects the vcvt_f32_f64 call to appear as "fcvtn v0.2s, v0.2d" in the
// emitted assembly.
float32x2_t test_vcvt_f32_f64(float64x2_t v) {
  // CHECK: fcvtn v0.2s, v0.2d
  const float32x2_t converted = vcvt_f32_f64(v);
  return converted;
}

// Expects the vcvt_high_f32_f64 call to appear as "fcvtn2 v0.4s, v1.2d" in the
// emitted assembly.
float32x4_t test_vcvt_high_f32_f64(float32x2_t x, float64x2_t v) {
  // CHECK: fcvtn2 v0.4s, v1.2d
  const float32x4_t converted = vcvt_high_f32_f64(x, v);
  return converted;
}

// Expects the vcvtx_f32_f64 call to appear as "fcvtxn v0.2s, v0.2d" in the
// emitted assembly.
float32x2_t test_vcvtx_f32_f64(float64x2_t v) {
  // CHECK: fcvtxn v0.2s, v0.2d
  const float32x2_t converted = vcvtx_f32_f64(v);
  return converted;
}