// REQUIRES: aarch64-registered-target
// RUN: %clang_cc1 -triple arm64-none-linux-gnu -target-feature +neon \
// RUN:   -ffp-contract=fast -S -O3 -o - %s | FileCheck %s

#include <arm_neon.h>

// Expect vld1q_dup_u8 to lower to ld1r on a .16b register.
uint8x16_t test_vld1q_dup_u8(uint8_t *a) {
  // CHECK-LABEL: test_vld1q_dup_u8
  // CHECK: ld1r {{{ *v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  uint8x16_t splat = vld1q_dup_u8(a);
  return splat;
}

// Expect vld1q_dup_u16 to lower to ld1r on a .8h register.
uint16x8_t test_vld1q_dup_u16(uint16_t *a) {
  // CHECK-LABEL: test_vld1q_dup_u16
  // CHECK: ld1r {{{ *v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  uint16x8_t splat = vld1q_dup_u16(a);
  return splat;
}

// Expect vld1q_dup_u32 to lower to ld1r on a .4s register.
uint32x4_t test_vld1q_dup_u32(uint32_t *a) {
  // CHECK-LABEL: test_vld1q_dup_u32
  // CHECK: ld1r {{{ *v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  uint32x4_t splat = vld1q_dup_u32(a);
  return splat;
}

// Expect vld1q_dup_u64 to lower to ld1r on a .2d register.
uint64x2_t test_vld1q_dup_u64(uint64_t *a) {
  // CHECK-LABEL: test_vld1q_dup_u64
  // CHECK: ld1r {{{ *v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  uint64x2_t splat = vld1q_dup_u64(a);
  return splat;
}

// Expect vld1q_dup_s8 to lower to ld1r on a .16b register.
int8x16_t test_vld1q_dup_s8(int8_t *a) {
  // CHECK-LABEL: test_vld1q_dup_s8
  // CHECK: ld1r {{{ *v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  int8x16_t splat = vld1q_dup_s8(a);
  return splat;
}

// Expect vld1q_dup_s16 to lower to ld1r on a .8h register.
int16x8_t test_vld1q_dup_s16(int16_t *a) {
  // CHECK-LABEL: test_vld1q_dup_s16
  // CHECK: ld1r {{{ *v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  int16x8_t splat = vld1q_dup_s16(a);
  return splat;
}

// Expect vld1q_dup_s32 to lower to ld1r on a .4s register.
int32x4_t test_vld1q_dup_s32(int32_t *a) {
  // CHECK-LABEL: test_vld1q_dup_s32
  // CHECK: ld1r {{{ *v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  int32x4_t splat = vld1q_dup_s32(a);
  return splat;
}

// Expect vld1q_dup_s64 to lower to ld1r on a .2d register.
int64x2_t test_vld1q_dup_s64(int64_t *a) {
  // CHECK-LABEL: test_vld1q_dup_s64
  // CHECK: ld1r {{{ *v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  int64x2_t splat = vld1q_dup_s64(a);
  return splat;
}

// Expect vld1q_dup_f16 to lower to ld1r on a .8h register.
float16x8_t test_vld1q_dup_f16(float16_t *a) {
  // CHECK-LABEL: test_vld1q_dup_f16
  // CHECK: ld1r {{{ *v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  float16x8_t splat = vld1q_dup_f16(a);
  return splat;
}

// Expect vld1q_dup_f32 to lower to ld1r on a .4s register.
float32x4_t test_vld1q_dup_f32(float32_t *a) {
  // CHECK-LABEL: test_vld1q_dup_f32
  // CHECK: ld1r {{{ *v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  float32x4_t splat = vld1q_dup_f32(a);
  return splat;
}

// Expect vld1q_dup_f64 to lower to ld1r on a .2d register.
float64x2_t test_vld1q_dup_f64(float64_t *a) {
  // CHECK-LABEL: test_vld1q_dup_f64
  // CHECK: ld1r {{{ *v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  float64x2_t splat = vld1q_dup_f64(a);
  return splat;
}

// Expect vld1q_dup_p8 to lower to ld1r on a .16b register.
poly8x16_t test_vld1q_dup_p8(poly8_t *a) {
  // CHECK-LABEL: test_vld1q_dup_p8
  // CHECK: ld1r {{{ *v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  poly8x16_t splat = vld1q_dup_p8(a);
  return splat;
}

// Expect vld1q_dup_p16 to lower to ld1r on a .8h register.
poly16x8_t test_vld1q_dup_p16(poly16_t *a) {
  // CHECK-LABEL: test_vld1q_dup_p16
  // CHECK: ld1r {{{ *v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  poly16x8_t splat = vld1q_dup_p16(a);
  return splat;
}

// Expect vld1q_dup_p64 to lower to ld1r on a .2d register.
poly64x2_t test_vld1q_dup_p64(poly64_t *a) {
  // CHECK-LABEL: test_vld1q_dup_p64
  // CHECK: ld1r {{{ *v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  poly64x2_t splat = vld1q_dup_p64(a);
  return splat;
}

// Expect vld1_dup_u8 to lower to ld1r on a .8b register.
uint8x8_t test_vld1_dup_u8(uint8_t *a) {
  // CHECK-LABEL: test_vld1_dup_u8
  // CHECK: ld1r {{{ *v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  uint8x8_t splat = vld1_dup_u8(a);
  return splat;
}

// Expect vld1_dup_u16 to lower to ld1r on a .4h register.
uint16x4_t test_vld1_dup_u16(uint16_t *a) {
  // CHECK-LABEL: test_vld1_dup_u16
  // CHECK: ld1r {{{ *v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  uint16x4_t splat = vld1_dup_u16(a);
  return splat;
}

// Expect vld1_dup_u32 to lower to ld1r on a .2s register.
uint32x2_t test_vld1_dup_u32(uint32_t *a) {
  // CHECK-LABEL: test_vld1_dup_u32
  // CHECK: ld1r {{{ *v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  uint32x2_t splat = vld1_dup_u32(a);
  return splat;
}

// Expect vld1_dup_u64 to lower to ld1r (.1d) or a plain ldr of a d register.
uint64x1_t test_vld1_dup_u64(uint64_t *a) {
  // CHECK-LABEL: test_vld1_dup_u64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  uint64x1_t splat = vld1_dup_u64(a);
  return splat;
}

// Expect vld1_dup_s8 to lower to ld1r on a .8b register.
int8x8_t test_vld1_dup_s8(int8_t *a) {
  // CHECK-LABEL: test_vld1_dup_s8
  // CHECK: ld1r {{{ *v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  int8x8_t splat = vld1_dup_s8(a);
  return splat;
}

// Expect vld1_dup_s16 to lower to ld1r on a .4h register.
int16x4_t test_vld1_dup_s16(int16_t *a) {
  // CHECK-LABEL: test_vld1_dup_s16
  // CHECK: ld1r {{{ *v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  int16x4_t splat = vld1_dup_s16(a);
  return splat;
}

// Expect vld1_dup_s32 to lower to ld1r on a .2s register.
int32x2_t test_vld1_dup_s32(int32_t *a) {
  // CHECK-LABEL: test_vld1_dup_s32
  // CHECK: ld1r {{{ *v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  int32x2_t splat = vld1_dup_s32(a);
  return splat;
}

// Expect vld1_dup_s64 to lower to ld1r (.1d) or a plain ldr of a d register.
int64x1_t test_vld1_dup_s64(int64_t *a) {
  // CHECK-LABEL: test_vld1_dup_s64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  int64x1_t splat = vld1_dup_s64(a);
  return splat;
}

// Expect vld1_dup_f16 to lower to ld1r on a .4h register.
float16x4_t test_vld1_dup_f16(float16_t *a) {
  // CHECK-LABEL: test_vld1_dup_f16
  // CHECK: ld1r {{{ *v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  float16x4_t splat = vld1_dup_f16(a);
  return splat;
}

// Expect vld1_dup_f32 to lower to ld1r on a .2s register.
float32x2_t test_vld1_dup_f32(float32_t *a) {
  // CHECK-LABEL: test_vld1_dup_f32
  // CHECK: ld1r {{{ *v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  float32x2_t splat = vld1_dup_f32(a);
  return splat;
}

// Expect vld1_dup_f64 to lower to ld1r (.1d) or a plain ldr of a d register.
float64x1_t test_vld1_dup_f64(float64_t *a) {
  // CHECK-LABEL: test_vld1_dup_f64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  float64x1_t splat = vld1_dup_f64(a);
  return splat;
}

// Expect vld1_dup_p8 to lower to ld1r on a .8b register.
poly8x8_t test_vld1_dup_p8(poly8_t *a) {
  // CHECK-LABEL: test_vld1_dup_p8
  // CHECK: ld1r {{{ *v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  poly8x8_t splat = vld1_dup_p8(a);
  return splat;
}

// Expect vld1_dup_p16 to lower to ld1r on a .4h register.
poly16x4_t test_vld1_dup_p16(poly16_t *a) {
  // CHECK-LABEL: test_vld1_dup_p16
  // CHECK: ld1r {{{ *v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  poly16x4_t splat = vld1_dup_p16(a);
  return splat;
}

// Expect vld1_dup_p64 to lower to ld1r (.1d) or a plain ldr of a d register.
poly64x1_t test_vld1_dup_p64(poly64_t *a) {
  // CHECK-LABEL: test_vld1_dup_p64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  poly64x1_t splat = vld1_dup_p64(a);
  return splat;
}

// Expect vld2q_dup_u8 to lower to ld2r on two .16b registers.
uint8x16x2_t test_vld2q_dup_u8(uint8_t *a) {
  // CHECK-LABEL: test_vld2q_dup_u8
  // CHECK: ld2r {{{ *v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  uint8x16x2_t splat = vld2q_dup_u8(a);
  return splat;
}

// Expect vld2q_dup_u16 to lower to ld2r on two .8h registers.
uint16x8x2_t test_vld2q_dup_u16(uint16_t *a) {
  // CHECK-LABEL: test_vld2q_dup_u16
  // CHECK: ld2r {{{ *v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  uint16x8x2_t splat = vld2q_dup_u16(a);
  return splat;
}

// Expect vld2q_dup_u32 to lower to ld2r on two .4s registers.
uint32x4x2_t test_vld2q_dup_u32(uint32_t *a) {
  // CHECK-LABEL: test_vld2q_dup_u32
  // CHECK: ld2r {{{ *v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  uint32x4x2_t splat = vld2q_dup_u32(a);
  return splat;
}

// Expect vld2q_dup_u64 to lower to ld2r on two .2d registers.
uint64x2x2_t test_vld2q_dup_u64(uint64_t *a) {
  // CHECK-LABEL: test_vld2q_dup_u64
  // CHECK: ld2r {{{ *v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  uint64x2x2_t splat = vld2q_dup_u64(a);
  return splat;
}

// Expect vld2q_dup_s8 to lower to ld2r on two .16b registers.
int8x16x2_t test_vld2q_dup_s8(int8_t *a) {
  // CHECK-LABEL: test_vld2q_dup_s8
  // CHECK: ld2r {{{ *v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  int8x16x2_t splat = vld2q_dup_s8(a);
  return splat;
}

// Expect vld2q_dup_s16 to lower to ld2r on two .8h registers.
int16x8x2_t test_vld2q_dup_s16(int16_t *a) {
  // CHECK-LABEL: test_vld2q_dup_s16
  // CHECK: ld2r {{{ *v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  int16x8x2_t splat = vld2q_dup_s16(a);
  return splat;
}

// Expect vld2q_dup_s32 to lower to ld2r on two .4s registers.
int32x4x2_t test_vld2q_dup_s32(int32_t *a) {
  // CHECK-LABEL: test_vld2q_dup_s32
  // CHECK: ld2r {{{ *v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  int32x4x2_t splat = vld2q_dup_s32(a);
  return splat;
}

// Expect vld2q_dup_s64 to lower to ld2r on two .2d registers.
int64x2x2_t test_vld2q_dup_s64(int64_t *a) {
  // CHECK-LABEL: test_vld2q_dup_s64
  // CHECK: ld2r {{{ *v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  int64x2x2_t splat = vld2q_dup_s64(a);
  return splat;
}

// Expect vld2q_dup_f16 to lower to ld2r on two .8h registers.
float16x8x2_t test_vld2q_dup_f16(float16_t *a) {
  // CHECK-LABEL: test_vld2q_dup_f16
  // CHECK: ld2r {{{ *v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  float16x8x2_t splat = vld2q_dup_f16(a);
  return splat;
}

// Expect vld2q_dup_f32 to lower to ld2r on two .4s registers.
float32x4x2_t test_vld2q_dup_f32(float32_t *a) {
  // CHECK-LABEL: test_vld2q_dup_f32
  // CHECK: ld2r {{{ *v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  float32x4x2_t splat = vld2q_dup_f32(a);
  return splat;
}

// Expect vld2q_dup_f64 to lower to ld2r on two .2d registers.
float64x2x2_t test_vld2q_dup_f64(float64_t *a) {
  // CHECK-LABEL: test_vld2q_dup_f64
  // CHECK: ld2r {{{ *v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  float64x2x2_t splat = vld2q_dup_f64(a);
  return splat;
}

// Expect vld2q_dup_p8 to lower to ld2r on two .16b registers.
poly8x16x2_t test_vld2q_dup_p8(poly8_t *a) {
  // CHECK-LABEL: test_vld2q_dup_p8
  // CHECK: ld2r {{{ *v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  poly8x16x2_t splat = vld2q_dup_p8(a);
  return splat;
}

// Expect vld2q_dup_p16 to lower to ld2r on two .8h registers.
poly16x8x2_t test_vld2q_dup_p16(poly16_t *a) {
  // CHECK-LABEL: test_vld2q_dup_p16
  // CHECK: ld2r {{{ *v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  poly16x8x2_t splat = vld2q_dup_p16(a);
  return splat;
}

// Expect vld2q_dup_p64 to lower to ld2r on two .2d registers.
poly64x2x2_t test_vld2q_dup_p64(poly64_t *a) {
  // CHECK-LABEL: test_vld2q_dup_p64
  // CHECK: ld2r {{{ *v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  poly64x2x2_t splat = vld2q_dup_p64(a);
  return splat;
}

// Expect vld2_dup_u8 to lower to ld2r on two .8b registers.
uint8x8x2_t test_vld2_dup_u8(uint8_t *a) {
  // CHECK-LABEL: test_vld2_dup_u8
  // CHECK: ld2r {{{ *v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  uint8x8x2_t splat = vld2_dup_u8(a);
  return splat;
}

// Expect vld2_dup_u16 to lower to ld2r on two .4h registers.
uint16x4x2_t test_vld2_dup_u16(uint16_t *a) {
  // CHECK-LABEL: test_vld2_dup_u16
  // CHECK: ld2r {{{ *v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  uint16x4x2_t splat = vld2_dup_u16(a);
  return splat;
}

// Expect vld2_dup_u32 to lower to ld2r on two .2s registers.
uint32x2x2_t test_vld2_dup_u32(uint32_t *a) {
  // CHECK-LABEL: test_vld2_dup_u32
  // CHECK: ld2r {{{ *v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  uint32x2x2_t splat = vld2_dup_u32(a);
  return splat;
}

// Expect vld2_dup_u64 to lower to ld1 or ld2r on two .1d registers.
uint64x1x2_t test_vld2_dup_u64(uint64_t *a) {
  // CHECK-LABEL: test_vld2_dup_u64
  // CHECK: {{ld1|ld2r}} {{{ *v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  uint64x1x2_t splat = vld2_dup_u64(a);
  return splat;
}

// Expect vld2_dup_s8 to lower to ld2r on two .8b registers.
int8x8x2_t test_vld2_dup_s8(int8_t *a) {
  // CHECK-LABEL: test_vld2_dup_s8
  // CHECK: ld2r {{{ *v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  int8x8x2_t splat = vld2_dup_s8(a);
  return splat;
}

// Expect vld2_dup_s16 to lower to ld2r on two .4h registers.
int16x4x2_t test_vld2_dup_s16(int16_t *a) {
  // CHECK-LABEL: test_vld2_dup_s16
  // CHECK: ld2r {{{ *v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  int16x4x2_t splat = vld2_dup_s16(a);
  return splat;
}

// Expect vld2_dup_s32 to lower to ld2r on two .2s registers.
int32x2x2_t test_vld2_dup_s32(int32_t *a) {
  // CHECK-LABEL: test_vld2_dup_s32
  // CHECK: ld2r {{{ *v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  int32x2x2_t splat = vld2_dup_s32(a);
  return splat;
}

// Expect vld2_dup_s64 to lower to ld1 or ld2r on two .1d registers.
int64x1x2_t test_vld2_dup_s64(int64_t *a) {
  // CHECK-LABEL: test_vld2_dup_s64
  // CHECK: {{ld1|ld2r}} {{{ *v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  int64x1x2_t splat = vld2_dup_s64(a);
  return splat;
}

// Expect vld2_dup_f16 to lower to ld2r on two .4h registers.
float16x4x2_t test_vld2_dup_f16(float16_t *a) {
  // CHECK-LABEL: test_vld2_dup_f16
  // CHECK: ld2r {{{ *v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  float16x4x2_t splat = vld2_dup_f16(a);
  return splat;
}

// Expect vld2_dup_f32 to lower to ld2r on two .2s registers.
float32x2x2_t test_vld2_dup_f32(float32_t *a) {
  // CHECK-LABEL: test_vld2_dup_f32
  // CHECK: ld2r {{{ *v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  float32x2x2_t splat = vld2_dup_f32(a);
  return splat;
}

// Expect vld2_dup_f64 to lower to ld1 or ld2r on two .1d registers.
float64x1x2_t test_vld2_dup_f64(float64_t *a) {
  // CHECK-LABEL: test_vld2_dup_f64
  // CHECK: {{ld1|ld2r}} {{{ *v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  float64x1x2_t splat = vld2_dup_f64(a);
  return splat;
}

// Expect vld2_dup_p8 to lower to ld2r on two .8b registers.
poly8x8x2_t test_vld2_dup_p8(poly8_t *a) {
  // CHECK-LABEL: test_vld2_dup_p8
  // CHECK: ld2r {{{ *v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  poly8x8x2_t splat = vld2_dup_p8(a);
  return splat;
}

// Expect vld2_dup_p16 to lower to ld2r on two .4h registers.
poly16x4x2_t test_vld2_dup_p16(poly16_t *a) {
  // CHECK-LABEL: test_vld2_dup_p16
  // CHECK: ld2r {{{ *v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  poly16x4x2_t splat = vld2_dup_p16(a);
  return splat;
}

// Expect vld2_dup_p64 to lower to ld1 or ld2r on two .1d registers.
poly64x1x2_t test_vld2_dup_p64(poly64_t *a) {
  // CHECK-LABEL: test_vld2_dup_p64
  // CHECK: {{ld1|ld2r}} {{{ *v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  poly64x1x2_t splat = vld2_dup_p64(a);
  return splat;
}

// Expect vld3q_dup_u8 to lower to ld3r on three .16b registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint8x16x3_t test_vld3q_dup_u8(uint8_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_u8
  return vld3q_dup_u8(a);
  // CHECK: ld3r {{{ *v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_u16 to lower to ld3r on three .8h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint16x8x3_t test_vld3q_dup_u16(uint16_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_u16
  return vld3q_dup_u16(a);
  // CHECK: ld3r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_u32 to lower to ld3r on three .4s registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint32x4x3_t test_vld3q_dup_u32(uint32_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_u32
  return vld3q_dup_u32(a);
  // CHECK: ld3r {{{ *v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_u64 to lower to ld3r on three .2d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint64x2x3_t test_vld3q_dup_u64(uint64_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_u64
  return vld3q_dup_u64(a);
  // CHECK: ld3r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_s8 to lower to ld3r on three .16b registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int8x16x3_t test_vld3q_dup_s8(int8_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_s8
  return vld3q_dup_s8(a);
  // CHECK: ld3r {{{ *v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_s16 to lower to ld3r on three .8h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int16x8x3_t test_vld3q_dup_s16(int16_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_s16
  return vld3q_dup_s16(a);
  // CHECK: ld3r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_s32 to lower to ld3r on three .4s registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int32x4x3_t test_vld3q_dup_s32(int32_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_s32
  return vld3q_dup_s32(a);
  // CHECK: ld3r {{{ *v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_s64 to lower to ld3r on three .2d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int64x2x3_t test_vld3q_dup_s64(int64_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_s64
  return vld3q_dup_s64(a);
  // CHECK: ld3r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_f16 to lower to ld3r on three .8h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
float16x8x3_t test_vld3q_dup_f16(float16_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_f16
  return vld3q_dup_f16(a);
  // CHECK: ld3r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_f32 to lower to ld3r on three .4s registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
float32x4x3_t test_vld3q_dup_f32(float32_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_f32
  return vld3q_dup_f32(a);
  // CHECK: ld3r {{{ *v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_f64 to lower to ld3r on three .2d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
float64x2x3_t test_vld3q_dup_f64(float64_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_f64
  return vld3q_dup_f64(a);
  // CHECK: ld3r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_p8 to lower to ld3r on three .16b registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
poly8x16x3_t test_vld3q_dup_p8(poly8_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_p8
  return vld3q_dup_p8(a);
  // CHECK: ld3r {{{ *v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_p16 to lower to ld3r on three .8h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
poly16x8x3_t test_vld3q_dup_p16(poly16_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_p16
  return vld3q_dup_p16(a);
  // CHECK: ld3r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3q_dup_p64 to lower to ld3r on three .2d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
poly64x2x3_t test_vld3q_dup_p64(poly64_t  *a) {
  // CHECK-LABEL: test_vld3q_dup_p64
  return vld3q_dup_p64(a);
  // CHECK: ld3r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_u8 to lower to ld3r on three .8b registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint8x8x3_t test_vld3_dup_u8(uint8_t  *a) {
  // CHECK-LABEL: test_vld3_dup_u8
  return vld3_dup_u8(a);
  // CHECK: ld3r {{{ *v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_u16 to lower to ld3r on three .4h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint16x4x3_t test_vld3_dup_u16(uint16_t  *a) {
  // CHECK-LABEL: test_vld3_dup_u16
  return vld3_dup_u16(a);
  // CHECK: ld3r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_u32 to lower to ld3r on three .2s registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint32x2x3_t test_vld3_dup_u32(uint32_t  *a) {
  // CHECK-LABEL: test_vld3_dup_u32
  return vld3_dup_u32(a);
  // CHECK: ld3r {{{ *v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_u64 to lower to ld1 or ld3r on three .1d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
uint64x1x3_t test_vld3_dup_u64(uint64_t  *a) {
  // CHECK-LABEL: test_vld3_dup_u64
  return vld3_dup_u64(a);
  // CHECK: {{ld1|ld3r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_s8 to lower to ld3r on three .8b registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int8x8x3_t test_vld3_dup_s8(int8_t  *a) {
  // CHECK-LABEL: test_vld3_dup_s8
  return vld3_dup_s8(a);
  // CHECK: ld3r {{{ *v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_s16 to lower to ld3r on three .4h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int16x4x3_t test_vld3_dup_s16(int16_t  *a) {
  // CHECK-LABEL: test_vld3_dup_s16
  return vld3_dup_s16(a);
  // CHECK: ld3r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_s32 to lower to ld3r on three .2s registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int32x2x3_t test_vld3_dup_s32(int32_t  *a) {
  // CHECK-LABEL: test_vld3_dup_s32
  return vld3_dup_s32(a);
  // CHECK: ld3r {{{ *v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_s64 to lower to ld1 or ld3r on three .1d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
int64x1x3_t test_vld3_dup_s64(int64_t  *a) {
  // CHECK-LABEL: test_vld3_dup_s64
  return vld3_dup_s64(a);
  // CHECK: {{ld1|ld3r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_f16 to lower to ld3r on three .4h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
float16x4x3_t test_vld3_dup_f16(float16_t  *a) {
  // CHECK-LABEL: test_vld3_dup_f16
  return vld3_dup_f16(a);
  // CHECK: ld3r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_f32 to lower to ld3r on three .2s registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
float32x2x3_t test_vld3_dup_f32(float32_t  *a) {
  // CHECK-LABEL: test_vld3_dup_f32
  return vld3_dup_f32(a);
  // CHECK: ld3r {{{ *v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_f64 to lower to ld1 or ld3r on three .1d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
float64x1x3_t test_vld3_dup_f64(float64_t  *a) {
  // CHECK-LABEL: test_vld3_dup_f64
  return vld3_dup_f64(a);
  // CHECK: {{ld1|ld3r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_p8 to lower to ld3r on three .8b registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
poly8x8x3_t test_vld3_dup_p8(poly8_t  *a) {
  // CHECK-LABEL: test_vld3_dup_p8
  return vld3_dup_p8(a);
  // CHECK: ld3r {{{ *v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_p16 to lower to ld3r on three .4h registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
poly16x4x3_t test_vld3_dup_p16(poly16_t  *a) {
  // CHECK-LABEL: test_vld3_dup_p16
  return vld3_dup_p16(a);
  // CHECK: ld3r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld3_dup_p64 to lower to ld1 or ld3r on three .1d registers.
// Keep the CHECK on one line; FileCheck ignores a wrapped comment line.
poly64x1x3_t test_vld3_dup_p64(poly64_t  *a) {
  // CHECK-LABEL: test_vld3_dup_p64
  return vld3_dup_p64(a);
  // CHECK: {{ld1|ld3r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
}

// Expect vld4q_dup_u8 to lower to ld4r on four .16b registers.
uint8x16x4_t test_vld4q_dup_u8(uint8_t *a) {
  // CHECK-LABEL: test_vld4q_dup_u8
  // CHECK: ld4r {{{ *v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  uint8x16x4_t splat = vld4q_dup_u8(a);
  return splat;
}

// Expect vld4q_dup_u16 to lower to ld4r on four .8h registers.
uint16x8x4_t test_vld4q_dup_u16(uint16_t *a) {
  // CHECK-LABEL: test_vld4q_dup_u16
  // CHECK: ld4r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  uint16x8x4_t splat = vld4q_dup_u16(a);
  return splat;
}

// Expect vld4q_dup_u32 to lower to ld4r on four .4s registers.
uint32x4x4_t test_vld4q_dup_u32(uint32_t *a) {
  // CHECK-LABEL: test_vld4q_dup_u32
  // CHECK: ld4r {{{ *v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  uint32x4x4_t splat = vld4q_dup_u32(a);
  return splat;
}

// Expect vld4q_dup_u64 to lower to ld4r on four .2d registers.
uint64x2x4_t test_vld4q_dup_u64(uint64_t *a) {
  // CHECK-LABEL: test_vld4q_dup_u64
  // CHECK: ld4r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  uint64x2x4_t splat = vld4q_dup_u64(a);
  return splat;
}

// Expect vld4q_dup_s8 to lower to ld4r on four .16b registers.
int8x16x4_t test_vld4q_dup_s8(int8_t *a) {
  // CHECK-LABEL: test_vld4q_dup_s8
  // CHECK: ld4r {{{ *v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  int8x16x4_t splat = vld4q_dup_s8(a);
  return splat;
}

// Expect vld4q_dup_s16 to lower to ld4r on four .8h registers.
int16x8x4_t test_vld4q_dup_s16(int16_t *a) {
  // CHECK-LABEL: test_vld4q_dup_s16
  // CHECK: ld4r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  int16x8x4_t splat = vld4q_dup_s16(a);
  return splat;
}

// Expect vld4q_dup_s32 to lower to ld4r on four .4s registers.
int32x4x4_t test_vld4q_dup_s32(int32_t *a) {
  // CHECK-LABEL: test_vld4q_dup_s32
  // CHECK: ld4r {{{ *v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  int32x4x4_t splat = vld4q_dup_s32(a);
  return splat;
}

// Expect vld4q_dup_s64 to lower to ld4r on four .2d registers.
int64x2x4_t test_vld4q_dup_s64(int64_t *a) {
  // CHECK-LABEL: test_vld4q_dup_s64
  // CHECK: ld4r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  int64x2x4_t splat = vld4q_dup_s64(a);
  return splat;
}

// Expect vld4q_dup_f16 to lower to ld4r on four .8h registers.
float16x8x4_t test_vld4q_dup_f16(float16_t *a) {
  // CHECK-LABEL: test_vld4q_dup_f16
  // CHECK: ld4r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  float16x8x4_t splat = vld4q_dup_f16(a);
  return splat;
}

// Expect vld4q_dup_f32 to lower to ld4r on four .4s registers.
float32x4x4_t test_vld4q_dup_f32(float32_t *a) {
  // CHECK-LABEL: test_vld4q_dup_f32
  // CHECK: ld4r {{{ *v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s, v[0-9]+.4s *}}}, [{{x[0-9]+|sp}}]
  float32x4x4_t splat = vld4q_dup_f32(a);
  return splat;
}

// Expect vld4q_dup_f64 to lower to ld4r on four .2d registers.
float64x2x4_t test_vld4q_dup_f64(float64_t *a) {
  // CHECK-LABEL: test_vld4q_dup_f64
  // CHECK: ld4r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  float64x2x4_t splat = vld4q_dup_f64(a);
  return splat;
}

// Expect vld4q_dup_p8 to lower to ld4r on four .16b registers.
poly8x16x4_t test_vld4q_dup_p8(poly8_t *a) {
  // CHECK-LABEL: test_vld4q_dup_p8
  // CHECK: ld4r {{{ *v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b, v[0-9]+.16b *}}}, [{{x[0-9]+|sp}}]
  poly8x16x4_t splat = vld4q_dup_p8(a);
  return splat;
}

// Expect vld4q_dup_p16 to lower to ld4r on four .8h registers.
poly16x8x4_t test_vld4q_dup_p16(poly16_t *a) {
  // CHECK-LABEL: test_vld4q_dup_p16
  // CHECK: ld4r {{{ *v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h, v[0-9]+.8h *}}}, [{{x[0-9]+|sp}}]
  poly16x8x4_t splat = vld4q_dup_p16(a);
  return splat;
}

// Expect vld4q_dup_p64 to lower to ld4r on four .2d registers.
poly64x2x4_t test_vld4q_dup_p64(poly64_t *a) {
  // CHECK-LABEL: test_vld4q_dup_p64
  // CHECK: ld4r {{{ *v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d, v[0-9]+.2d *}}}, [{{x[0-9]+|sp}}]
  poly64x2x4_t splat = vld4q_dup_p64(a);
  return splat;
}

// Expect vld4_dup_u8 to lower to ld4r on four .8b registers.
uint8x8x4_t test_vld4_dup_u8(uint8_t *a) {
  // CHECK-LABEL: test_vld4_dup_u8
  // CHECK: ld4r {{{ *v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  uint8x8x4_t splat = vld4_dup_u8(a);
  return splat;
}

// Expect vld4_dup_u16 to lower to ld4r on four .4h registers.
uint16x4x4_t test_vld4_dup_u16(uint16_t *a) {
  // CHECK-LABEL: test_vld4_dup_u16
  // CHECK: ld4r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  uint16x4x4_t splat = vld4_dup_u16(a);
  return splat;
}

// Expect vld4_dup_u32 to lower to ld4r on four .2s registers.
uint32x2x4_t test_vld4_dup_u32(uint32_t *a) {
  // CHECK-LABEL: test_vld4_dup_u32
  // CHECK: ld4r {{{ *v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  uint32x2x4_t splat = vld4_dup_u32(a);
  return splat;
}

// Expect vld4_dup_u64 to lower to ld1 or ld4r on four .1d registers.
uint64x1x4_t test_vld4_dup_u64(uint64_t *a) {
  // CHECK-LABEL: test_vld4_dup_u64
  // CHECK: {{ld1|ld4r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  uint64x1x4_t splat = vld4_dup_u64(a);
  return splat;
}

// Expect vld4_dup_s8 to lower to ld4r on four .8b registers.
int8x8x4_t test_vld4_dup_s8(int8_t *a) {
  // CHECK-LABEL: test_vld4_dup_s8
  // CHECK: ld4r {{{ *v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  int8x8x4_t splat = vld4_dup_s8(a);
  return splat;
}

// Expect vld4_dup_s16 to lower to ld4r on four .4h registers.
int16x4x4_t test_vld4_dup_s16(int16_t *a) {
  // CHECK-LABEL: test_vld4_dup_s16
  // CHECK: ld4r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  int16x4x4_t splat = vld4_dup_s16(a);
  return splat;
}

// Expect vld4_dup_s32 to lower to ld4r on four .2s registers.
int32x2x4_t test_vld4_dup_s32(int32_t *a) {
  // CHECK-LABEL: test_vld4_dup_s32
  // CHECK: ld4r {{{ *v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  int32x2x4_t splat = vld4_dup_s32(a);
  return splat;
}

// Expect vld4_dup_s64 to lower to ld1 or ld4r on four .1d registers.
int64x1x4_t test_vld4_dup_s64(int64_t *a) {
  // CHECK-LABEL: test_vld4_dup_s64
  // CHECK: {{ld1|ld4r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  int64x1x4_t splat = vld4_dup_s64(a);
  return splat;
}

// Expect vld4_dup_f16 to lower to ld4r on four .4h registers.
float16x4x4_t test_vld4_dup_f16(float16_t *a) {
  // CHECK-LABEL: test_vld4_dup_f16
  // CHECK: ld4r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  float16x4x4_t splat = vld4_dup_f16(a);
  return splat;
}

// Expect vld4_dup_f32 to lower to ld4r on four .2s registers.
float32x2x4_t test_vld4_dup_f32(float32_t *a) {
  // CHECK-LABEL: test_vld4_dup_f32
  // CHECK: ld4r {{{ *v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s, v[0-9]+.2s *}}}, [{{x[0-9]+|sp}}]
  float32x2x4_t splat = vld4_dup_f32(a);
  return splat;
}

// Expect vld4_dup_f64 to lower to ld1 or ld4r on four .1d registers.
float64x1x4_t test_vld4_dup_f64(float64_t *a) {
  // CHECK-LABEL: test_vld4_dup_f64
  // CHECK: {{ld1|ld4r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  float64x1x4_t splat = vld4_dup_f64(a);
  return splat;
}

// Expect vld4_dup_p8 to lower to ld4r on four .8b registers.
poly8x8x4_t test_vld4_dup_p8(poly8_t *a) {
  // CHECK-LABEL: test_vld4_dup_p8
  // CHECK: ld4r {{{ *v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b, v[0-9]+.8b *}}}, [{{x[0-9]+|sp}}]
  poly8x8x4_t splat = vld4_dup_p8(a);
  return splat;
}

// Expect vld4_dup_p16 to lower to ld4r on four .4h registers.
poly16x4x4_t test_vld4_dup_p16(poly16_t *a) {
  // CHECK-LABEL: test_vld4_dup_p16
  // CHECK: ld4r {{{ *v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h, v[0-9]+.4h *}}}, [{{x[0-9]+|sp}}]
  poly16x4x4_t splat = vld4_dup_p16(a);
  return splat;
}

// Expect vld4_dup_p64 to lower to ld1 or ld4r on four .1d registers.
poly64x1x4_t test_vld4_dup_p64(poly64_t *a) {
  // CHECK-LABEL: test_vld4_dup_p64
  // CHECK: {{ld1|ld4r}} {{{ *v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d, v[0-9]+.1d *}}}, [{{x[0-9]+|sp}}]
  poly64x1x4_t splat = vld4_dup_p64(a);
  return splat;
}

// Expect vld1q_lane_u8 at lane 15 to lower to ld1 on .b[15].
uint8x16_t test_vld1q_lane_u8(uint8_t *a, uint8x16_t b) {
  // CHECK-LABEL: test_vld1q_lane_u8
  // CHECK: ld1 {{{ *v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
  uint8x16_t merged = vld1q_lane_u8(a, b, 15);
  return merged;
}

// Expect vld1q_lane_u16 at lane 7 to lower to ld1 on .h[7].
uint16x8_t test_vld1q_lane_u16(uint16_t *a, uint16x8_t b) {
  // CHECK-LABEL: test_vld1q_lane_u16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  uint16x8_t merged = vld1q_lane_u16(a, b, 7);
  return merged;
}

// Expect vld1q_lane_u32 at lane 3 to lower to ld1 on .s[3].
uint32x4_t test_vld1q_lane_u32(uint32_t *a, uint32x4_t b) {
  // CHECK-LABEL: test_vld1q_lane_u32
  // CHECK: ld1 {{{ *v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
  uint32x4_t merged = vld1q_lane_u32(a, b, 3);
  return merged;
}

// Expect vld1q_lane_u64 at lane 1 to lower to ld1 on .d[1].
uint64x2_t test_vld1q_lane_u64(uint64_t *a, uint64x2_t b) {
  // CHECK-LABEL: test_vld1q_lane_u64
  // CHECK: ld1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  uint64x2_t merged = vld1q_lane_u64(a, b, 1);
  return merged;
}

// Expect vld1q_lane_s8 at lane 15 to lower to ld1 on .b[15].
int8x16_t test_vld1q_lane_s8(int8_t *a, int8x16_t b) {
  // CHECK-LABEL: test_vld1q_lane_s8
  // CHECK: ld1 {{{ *v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
  int8x16_t merged = vld1q_lane_s8(a, b, 15);
  return merged;
}

// Expect vld1q_lane_s16 at lane 7 to lower to ld1 on .h[7].
int16x8_t test_vld1q_lane_s16(int16_t *a, int16x8_t b) {
  // CHECK-LABEL: test_vld1q_lane_s16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  int16x8_t merged = vld1q_lane_s16(a, b, 7);
  return merged;
}

// Expect vld1q_lane_s32 at lane 3 to lower to ld1 on .s[3].
int32x4_t test_vld1q_lane_s32(int32_t *a, int32x4_t b) {
  // CHECK-LABEL: test_vld1q_lane_s32
  // CHECK: ld1 {{{ *v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
  int32x4_t merged = vld1q_lane_s32(a, b, 3);
  return merged;
}

// Expect vld1q_lane_s64 at lane 1 to lower to ld1 on .d[1].
int64x2_t test_vld1q_lane_s64(int64_t *a, int64x2_t b) {
  // CHECK-LABEL: test_vld1q_lane_s64
  // CHECK: ld1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  int64x2_t merged = vld1q_lane_s64(a, b, 1);
  return merged;
}

// Expect vld1q_lane_f16 at lane 7 to lower to ld1 on .h[7].
float16x8_t test_vld1q_lane_f16(float16_t *a, float16x8_t b) {
  // CHECK-LABEL: test_vld1q_lane_f16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  float16x8_t merged = vld1q_lane_f16(a, b, 7);
  return merged;
}

// Expect vld1q_lane_f32 at lane 3 to lower to ld1 on .s[3].
float32x4_t test_vld1q_lane_f32(float32_t *a, float32x4_t b) {
  // CHECK-LABEL: test_vld1q_lane_f32
  // CHECK: ld1 {{{ *v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
  float32x4_t merged = vld1q_lane_f32(a, b, 3);
  return merged;
}

// Expect vld1q_lane_f64 at lane 1 to lower to ld1 on .d[1].
float64x2_t test_vld1q_lane_f64(float64_t *a, float64x2_t b) {
  // CHECK-LABEL: test_vld1q_lane_f64
  // CHECK: ld1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  float64x2_t merged = vld1q_lane_f64(a, b, 1);
  return merged;
}

// Expect vld1q_lane_p8 at lane 15 to lower to ld1 on .b[15].
poly8x16_t test_vld1q_lane_p8(poly8_t *a, poly8x16_t b) {
  // CHECK-LABEL: test_vld1q_lane_p8
  // CHECK: ld1 {{{ *v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
  poly8x16_t merged = vld1q_lane_p8(a, b, 15);
  return merged;
}

// Expect vld1q_lane_p16 at lane 7 to lower to ld1 on .h[7].
poly16x8_t test_vld1q_lane_p16(poly16_t *a, poly16x8_t b) {
  // CHECK-LABEL: test_vld1q_lane_p16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  poly16x8_t merged = vld1q_lane_p16(a, b, 7);
  return merged;
}

// Expect vld1q_lane_p64 at lane 1 to lower to ld1 on .d[1].
poly64x2_t test_vld1q_lane_p64(poly64_t *a, poly64x2_t b) {
  // CHECK-LABEL: test_vld1q_lane_p64
  // CHECK: ld1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  poly64x2_t merged = vld1q_lane_p64(a, b, 1);
  return merged;
}

// Expect vld1_lane_u8 at lane 7 to lower to ld1 on .b[7].
uint8x8_t test_vld1_lane_u8(uint8_t *a, uint8x8_t b) {
  // CHECK-LABEL: test_vld1_lane_u8
  // CHECK: ld1 {{{ *v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
  uint8x8_t merged = vld1_lane_u8(a, b, 7);
  return merged;
}

// Expect vld1_lane_u16 at lane 3 to lower to ld1 on .h[3].
uint16x4_t test_vld1_lane_u16(uint16_t *a, uint16x4_t b) {
  // CHECK-LABEL: test_vld1_lane_u16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  uint16x4_t merged = vld1_lane_u16(a, b, 3);
  return merged;
}

// Expect vld1_lane_u32 at lane 1 to lower to ld1 on .s[1].
uint32x2_t test_vld1_lane_u32(uint32_t *a, uint32x2_t b) {
  // CHECK-LABEL: test_vld1_lane_u32
  // CHECK: ld1 {{{ *v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
  uint32x2_t merged = vld1_lane_u32(a, b, 1);
  return merged;
}

// Expect vld1_lane_u64 at lane 0 to lower to ld1r (.1d) or a plain ldr of a d register.
uint64x1_t test_vld1_lane_u64(uint64_t *a, uint64x1_t b) {
  // CHECK-LABEL: test_vld1_lane_u64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  uint64x1_t merged = vld1_lane_u64(a, b, 0);
  return merged;
}

// Expect vld1_lane_s8 at lane 7 to lower to ld1 on .b[7].
int8x8_t test_vld1_lane_s8(int8_t *a, int8x8_t b) {
  // CHECK-LABEL: test_vld1_lane_s8
  // CHECK: ld1 {{{ *v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
  int8x8_t merged = vld1_lane_s8(a, b, 7);
  return merged;
}

// Expect vld1_lane_s16 at lane 3 to lower to ld1 on .h[3].
int16x4_t test_vld1_lane_s16(int16_t *a, int16x4_t b) {
  // CHECK-LABEL: test_vld1_lane_s16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  int16x4_t merged = vld1_lane_s16(a, b, 3);
  return merged;
}

// Expect vld1_lane_s32 at lane 1 to lower to ld1 on .s[1].
int32x2_t test_vld1_lane_s32(int32_t *a, int32x2_t b) {
  // CHECK-LABEL: test_vld1_lane_s32
  // CHECK: ld1 {{{ *v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
  int32x2_t merged = vld1_lane_s32(a, b, 1);
  return merged;
}

// Expect vld1_lane_s64 at lane 0 to lower to ld1r (.1d) or a plain ldr of a d register.
int64x1_t test_vld1_lane_s64(int64_t *a, int64x1_t b) {
  // CHECK-LABEL: test_vld1_lane_s64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  int64x1_t merged = vld1_lane_s64(a, b, 0);
  return merged;
}

// Expect vld1_lane_f16 at lane 3 to lower to ld1 on .h[3].
float16x4_t test_vld1_lane_f16(float16_t *a, float16x4_t b) {
  // CHECK-LABEL: test_vld1_lane_f16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  float16x4_t merged = vld1_lane_f16(a, b, 3);
  return merged;
}

// Expect vld1_lane_f32 at lane 1 to lower to ld1 on .s[1].
float32x2_t test_vld1_lane_f32(float32_t *a, float32x2_t b) {
  // CHECK-LABEL: test_vld1_lane_f32
  // CHECK: ld1 {{{ *v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
  float32x2_t merged = vld1_lane_f32(a, b, 1);
  return merged;
}

// Expect vld1_lane_f64 at lane 0 to lower to ld1r (.1d) or a plain ldr of a d register.
float64x1_t test_vld1_lane_f64(float64_t *a, float64x1_t b) {
  // CHECK-LABEL: test_vld1_lane_f64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  float64x1_t merged = vld1_lane_f64(a, b, 0);
  return merged;
}

// Expect vld1_lane_p8 at lane 7 to lower to ld1 on .b[7].
poly8x8_t test_vld1_lane_p8(poly8_t *a, poly8x8_t b) {
  // CHECK-LABEL: test_vld1_lane_p8
  // CHECK: ld1 {{{ *v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
  poly8x8_t merged = vld1_lane_p8(a, b, 7);
  return merged;
}

// Expect vld1_lane_p16 at lane 3 to lower to ld1 on .h[3].
poly16x4_t test_vld1_lane_p16(poly16_t *a, poly16x4_t b) {
  // CHECK-LABEL: test_vld1_lane_p16
  // CHECK: ld1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  poly16x4_t merged = vld1_lane_p16(a, b, 3);
  return merged;
}

// Expect vld1_lane_p64 at lane 0 to lower to ld1r (.1d) or a plain ldr of a d register.
poly64x1_t test_vld1_lane_p64(poly64_t *a, poly64x1_t b) {
  // CHECK-LABEL: test_vld1_lane_p64
  // CHECK: {{ld1r { v[0-9]+.1d }|ldr d[0-9]+}}, [{{x[0-9]+|sp}}]
  poly64x1_t merged = vld1_lane_p64(a, b, 0);
  return merged;
}

// Expect vld2q_lane_s8 at lane 15 to lower to ld2 on two .b[15] lanes via x0.
int8x16x2_t test_vld2q_lane_s8(const int8_t *ptr, int8x16x2_t src) {
  // CHECK-LABEL: test_vld2q_lane_s8
  // CHECK: ld2 {{{ *v[0-9]+.b,  v[0-9]+.b *}}}[15], [x0]
  int8x16x2_t merged = vld2q_lane_s8(ptr, src, 15);
  return merged;
}

// Expect vld2q_lane_u8 at lane 15 to lower to ld2 on two .b[15] lanes via x0.
uint8x16x2_t test_vld2q_lane_u8(const uint8_t *ptr, uint8x16x2_t src) {
  // CHECK-LABEL: test_vld2q_lane_u8
  // CHECK: ld2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[15], [x0]
  uint8x16x2_t merged = vld2q_lane_u8(ptr, src, 15);
  return merged;
}

// Expect vld2q_lane_p8 at lane 15 to lower to ld2 on two .b[15] lanes via x0.
poly8x16x2_t test_vld2q_lane_p8(const poly8_t *ptr, poly8x16x2_t src) {
  // CHECK-LABEL: test_vld2q_lane_p8
  // CHECK: ld2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[15], [x0]
  poly8x16x2_t merged = vld2q_lane_p8(ptr, src, 15);
  return merged;
}

// Expect vld3q_lane_s8 at lane 15 to lower to ld3 on three .b[15] lanes via x0.
int8x16x3_t test_vld3q_lane_s8(const int8_t *ptr, int8x16x3_t src) {
  // CHECK-LABEL: test_vld3q_lane_s8
  // CHECK: ld3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [x0]
  int8x16x3_t merged = vld3q_lane_s8(ptr, src, 15);
  return merged;
}

// Expect vld3q_lane_u8 at lane 15 to lower to ld3 on three .b[15] lanes via x0.
uint8x16x3_t test_vld3q_lane_u8(const uint8_t *ptr, uint8x16x3_t src) {
  // CHECK-LABEL: test_vld3q_lane_u8
  // CHECK: ld3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [x0]
  uint8x16x3_t merged = vld3q_lane_u8(ptr, src, 15);
  return merged;
}

// Expect vld2q_lane_u16 at lane 7 to lower to ld2 on two .h[7] lanes.
uint16x8x2_t test_vld2q_lane_u16(uint16_t *a, uint16x8x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_u16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  uint16x8x2_t merged = vld2q_lane_u16(a, b, 7);
  return merged;
}

// Expect vld2q_lane_u32 at lane 3 to lower to ld2 on two .s[3] lanes.
uint32x4x2_t test_vld2q_lane_u32(uint32_t *a, uint32x4x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_u32
  // CHECK: ld2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
  uint32x4x2_t merged = vld2q_lane_u32(a, b, 3);
  return merged;
}

// Expect vld2q_lane_u64 at lane 1 to lower to ld2 on two .d[1] lanes.
uint64x2x2_t test_vld2q_lane_u64(uint64_t *a, uint64x2x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_u64
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  uint64x2x2_t merged = vld2q_lane_u64(a, b, 1);
  return merged;
}

// Expect vld2q_lane_s16 at lane 7 to lower to ld2 on two .h[7] lanes.
int16x8x2_t test_vld2q_lane_s16(int16_t *a, int16x8x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_s16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  int16x8x2_t merged = vld2q_lane_s16(a, b, 7);
  return merged;
}

// Expect vld2q_lane_s32 at lane 3 to lower to ld2 on two .s[3] lanes.
int32x4x2_t test_vld2q_lane_s32(int32_t *a, int32x4x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_s32
  // CHECK: ld2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
  int32x4x2_t merged = vld2q_lane_s32(a, b, 3);
  return merged;
}

// Expect vld2q_lane_s64 at lane 1 to lower to ld2 on two .d[1] lanes.
int64x2x2_t test_vld2q_lane_s64(int64_t *a, int64x2x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_s64
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  int64x2x2_t merged = vld2q_lane_s64(a, b, 1);
  return merged;
}

// Expect vld2q_lane_f16 at lane 7 to lower to ld2 on two .h[7] lanes.
float16x8x2_t test_vld2q_lane_f16(float16_t *a, float16x8x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_f16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  float16x8x2_t merged = vld2q_lane_f16(a, b, 7);
  return merged;
}

// Expect vld2q_lane_f32 at lane 3 to lower to ld2 on two .s[3] lanes.
float32x4x2_t test_vld2q_lane_f32(float32_t *a, float32x4x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_f32
  // CHECK: ld2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
  float32x4x2_t merged = vld2q_lane_f32(a, b, 3);
  return merged;
}

// Expect vld2q_lane_f64 at lane 1 to lower to ld2 on two .d[1] lanes.
float64x2x2_t test_vld2q_lane_f64(float64_t *a, float64x2x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_f64
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  float64x2x2_t merged = vld2q_lane_f64(a, b, 1);
  return merged;
}

// Expect vld2q_lane_p16 at lane 7 to lower to ld2 on two .h[7] lanes.
poly16x8x2_t test_vld2q_lane_p16(poly16_t *a, poly16x8x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_p16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
  poly16x8x2_t merged = vld2q_lane_p16(a, b, 7);
  return merged;
}

// Expect vld2q_lane_p64 at lane 1 to lower to ld2 on two .d[1] lanes.
poly64x2x2_t test_vld2q_lane_p64(poly64_t *a, poly64x2x2_t b) {
  // CHECK-LABEL: test_vld2q_lane_p64
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
  poly64x2x2_t merged = vld2q_lane_p64(a, b, 1);
  return merged;
}

// Expect vld2_lane_u8 at lane 7 to lower to ld2 on two .b[7] lanes.
uint8x8x2_t test_vld2_lane_u8(uint8_t *a, uint8x8x2_t b) {
  // CHECK-LABEL: test_vld2_lane_u8
  // CHECK: ld2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
  uint8x8x2_t merged = vld2_lane_u8(a, b, 7);
  return merged;
}

// Expect vld2_lane_u16 at lane 3 to lower to ld2 on two .h[3] lanes.
uint16x4x2_t test_vld2_lane_u16(uint16_t *a, uint16x4x2_t b) {
  // CHECK-LABEL: test_vld2_lane_u16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  uint16x4x2_t merged = vld2_lane_u16(a, b, 3);
  return merged;
}

// Expect vld2_lane_u32 at lane 1 to lower to ld2 on two .s[1] lanes.
uint32x2x2_t test_vld2_lane_u32(uint32_t *a, uint32x2x2_t b) {
  // CHECK-LABEL: test_vld2_lane_u32
  // CHECK: ld2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
  uint32x2x2_t merged = vld2_lane_u32(a, b, 1);
  return merged;
}

// Expect vld2_lane_u64 at lane 0 to lower to ld2 on two .d[0] lanes.
uint64x1x2_t test_vld2_lane_u64(uint64_t *a, uint64x1x2_t b) {
  // CHECK-LABEL: test_vld2_lane_u64
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
  uint64x1x2_t merged = vld2_lane_u64(a, b, 0);
  return merged;
}

// Expect vld2_lane_s8 at lane 7 to lower to ld2 on two .b[7] lanes.
int8x8x2_t test_vld2_lane_s8(int8_t *a, int8x8x2_t b) {
  // CHECK-LABEL: test_vld2_lane_s8
  // CHECK: ld2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
  int8x8x2_t merged = vld2_lane_s8(a, b, 7);
  return merged;
}

// Expect vld2_lane_s16 at lane 3 to lower to ld2 on two .h[3] lanes.
int16x4x2_t test_vld2_lane_s16(int16_t *a, int16x4x2_t b) {
  // CHECK-LABEL: test_vld2_lane_s16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  int16x4x2_t merged = vld2_lane_s16(a, b, 3);
  return merged;
}

// Expect vld2_lane_s32 at lane 1 to lower to ld2 on two .s[1] lanes.
int32x2x2_t test_vld2_lane_s32(int32_t *a, int32x2x2_t b) {
  // CHECK-LABEL: test_vld2_lane_s32
  // CHECK: ld2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
  int32x2x2_t merged = vld2_lane_s32(a, b, 1);
  return merged;
}

// Expect vld2_lane_s64 at lane 0 to lower to ld2 on two .d[0] lanes.
int64x1x2_t test_vld2_lane_s64(int64_t *a, int64x1x2_t b) {
  // CHECK-LABEL: test_vld2_lane_s64
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
  int64x1x2_t merged = vld2_lane_s64(a, b, 0);
  return merged;
}

// Expect vld2_lane_f16 at lane 3 to lower to ld2 on two .h[3] lanes.
float16x4x2_t test_vld2_lane_f16(float16_t *a, float16x4x2_t b) {
  // CHECK-LABEL: test_vld2_lane_f16
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
  float16x4x2_t merged = vld2_lane_f16(a, b, 3);
  return merged;
}

// Expect vld2_lane_f32 at lane 1 to lower to ld2 on two .s[1] lanes.
float32x2x2_t test_vld2_lane_f32(float32_t *a, float32x2x2_t b) {
  // CHECK-LABEL: test_vld2_lane_f32
  // CHECK: ld2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
  float32x2x2_t merged = vld2_lane_f32(a, b, 1);
  return merged;
}

// Codegen test: vld2_lane_f64 with lane 0 is expected to emit `ld2` on two
// `.d` registers at lane [0], with the address in an x register or sp.
float64x1x2_t test_vld2_lane_f64(float64_t  *a, float64x1x2_t b) {
  // CHECK-LABEL: test_vld2_lane_f64
  return vld2_lane_f64(a, b, 0);
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld2_lane_p8 with lane 7 is expected to emit `ld2` on two
// `.b` registers at lane [7], with the address in an x register or sp.
poly8x8x2_t test_vld2_lane_p8(poly8_t  *a, poly8x8x2_t b) {
  // CHECK-LABEL: test_vld2_lane_p8
  return vld2_lane_p8(a, b, 7);
  // CHECK: ld2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld2_lane_p16 with lane 3 is expected to emit `ld2` on two
// `.h` registers at lane [3], with the address in an x register or sp.
poly16x4x2_t test_vld2_lane_p16(poly16_t  *a, poly16x4x2_t b) {
  // CHECK-LABEL: test_vld2_lane_p16
  return vld2_lane_p16(a, b, 3);
  // CHECK: ld2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld2_lane_p64 with lane 0 is expected to emit `ld2` on two
// `.d` registers at lane [0], with the address in an x register or sp.
poly64x1x2_t test_vld2_lane_p64(poly64_t  *a, poly64x1x2_t b) {
  // CHECK-LABEL: test_vld2_lane_p64
  return vld2_lane_p64(a, b, 0);
  // CHECK: ld2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_u16 with lane 7 is expected to emit `ld3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
uint16x8x3_t test_vld3q_lane_u16(uint16_t  *a, uint16x8x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_u16
  return vld3q_lane_u16(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_u32 with lane 3 is expected to emit `ld3` on three
// `.s` registers at lane [3], with the address in an x register or sp.
uint32x4x3_t test_vld3q_lane_u32(uint32_t  *a, uint32x4x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_u32
  return vld3q_lane_u32(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_u64 with lane 1 is expected to emit `ld3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
uint64x2x3_t test_vld3q_lane_u64(uint64_t  *a, uint64x2x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_u64
  return vld3q_lane_u64(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_s16 with lane 7 is expected to emit `ld3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
int16x8x3_t test_vld3q_lane_s16(int16_t  *a, int16x8x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_s16
  return vld3q_lane_s16(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_s32 with lane 3 is expected to emit `ld3` on three
// `.s` registers at lane [3], with the address in an x register or sp.
int32x4x3_t test_vld3q_lane_s32(int32_t  *a, int32x4x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_s32
  return vld3q_lane_s32(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_s64 with lane 1 is expected to emit `ld3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
int64x2x3_t test_vld3q_lane_s64(int64_t  *a, int64x2x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_s64
  return vld3q_lane_s64(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_f16 with lane 7 is expected to emit `ld3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
float16x8x3_t test_vld3q_lane_f16(float16_t  *a, float16x8x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_f16
  return vld3q_lane_f16(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_f32 with lane 3 is expected to emit `ld3` on three
// `.s` registers at lane [3], with the address in an x register or sp.
float32x4x3_t test_vld3q_lane_f32(float32_t  *a, float32x4x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_f32
  return vld3q_lane_f32(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_f64 with lane 1 is expected to emit `ld3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
float64x2x3_t test_vld3q_lane_f64(float64_t  *a, float64x2x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_f64
  return vld3q_lane_f64(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_p8 with lane 15 is expected to emit `ld3` on three
// `.b` registers at lane [15], with the address in an x register or sp.
poly8x16x3_t test_vld3q_lane_p8(poly8_t  *a, poly8x16x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_p8
  return vld3q_lane_p8(a, b, 15);
  // CHECK: ld3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_p16 with lane 7 is expected to emit `ld3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
poly16x8x3_t test_vld3q_lane_p16(poly16_t  *a, poly16x8x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_p16
  return vld3q_lane_p16(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3q_lane_p64 with lane 1 is expected to emit `ld3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
poly64x2x3_t test_vld3q_lane_p64(poly64_t  *a, poly64x2x3_t b) {
  // CHECK-LABEL: test_vld3q_lane_p64
  return vld3q_lane_p64(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_u8 with lane 7 is expected to emit `ld3` on three
// `.b` registers at lane [7], with the address in an x register or sp.
uint8x8x3_t test_vld3_lane_u8(uint8_t  *a, uint8x8x3_t b) {
  // CHECK-LABEL: test_vld3_lane_u8
  return vld3_lane_u8(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_u16 with lane 3 is expected to emit `ld3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
uint16x4x3_t test_vld3_lane_u16(uint16_t  *a, uint16x4x3_t b) {
  // CHECK-LABEL: test_vld3_lane_u16
  return vld3_lane_u16(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_u32 with lane 1 is expected to emit `ld3` on three
// `.s` registers at lane [1], with the address in an x register or sp.
uint32x2x3_t test_vld3_lane_u32(uint32_t  *a, uint32x2x3_t b) {
  // CHECK-LABEL: test_vld3_lane_u32
  return vld3_lane_u32(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_u64 with lane 0 is expected to emit `ld3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
uint64x1x3_t test_vld3_lane_u64(uint64_t  *a, uint64x1x3_t b) {
  // CHECK-LABEL: test_vld3_lane_u64
  return vld3_lane_u64(a, b, 0);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_s8 with lane 7 is expected to emit `ld3` on three
// `.b` registers at lane [7], with the address in an x register or sp.
int8x8x3_t test_vld3_lane_s8(int8_t  *a, int8x8x3_t b) {
  // CHECK-LABEL: test_vld3_lane_s8
  return vld3_lane_s8(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_s16 with lane 3 is expected to emit `ld3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
int16x4x3_t test_vld3_lane_s16(int16_t  *a, int16x4x3_t b) {
  // CHECK-LABEL: test_vld3_lane_s16
  return vld3_lane_s16(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_s32 with lane 1 is expected to emit `ld3` on three
// `.s` registers at lane [1], with the address in an x register or sp.
int32x2x3_t test_vld3_lane_s32(int32_t  *a, int32x2x3_t b) {
  // CHECK-LABEL: test_vld3_lane_s32
  return vld3_lane_s32(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_s64 with lane 0 is expected to emit `ld3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
int64x1x3_t test_vld3_lane_s64(int64_t  *a, int64x1x3_t b) {
  // CHECK-LABEL: test_vld3_lane_s64
  return vld3_lane_s64(a, b, 0);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_f16 with lane 3 is expected to emit `ld3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
float16x4x3_t test_vld3_lane_f16(float16_t  *a, float16x4x3_t b) {
  // CHECK-LABEL: test_vld3_lane_f16
  return vld3_lane_f16(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_f32 with lane 1 is expected to emit `ld3` on three
// `.s` registers at lane [1], with the address in an x register or sp.
float32x2x3_t test_vld3_lane_f32(float32_t  *a, float32x2x3_t b) {
  // CHECK-LABEL: test_vld3_lane_f32
  return vld3_lane_f32(a, b, 1);
  // CHECK: ld3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_f64 with lane 0 is expected to emit `ld3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
float64x1x3_t test_vld3_lane_f64(float64_t  *a, float64x1x3_t b) {
  // CHECK-LABEL: test_vld3_lane_f64
  return vld3_lane_f64(a, b, 0);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_p8 with lane 7 is expected to emit `ld3` on three
// `.b` registers at lane [7], with the address in an x register or sp.
poly8x8x3_t test_vld3_lane_p8(poly8_t  *a, poly8x8x3_t b) {
  // CHECK-LABEL: test_vld3_lane_p8
  return vld3_lane_p8(a, b, 7);
  // CHECK: ld3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_p16 with lane 3 is expected to emit `ld3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
poly16x4x3_t test_vld3_lane_p16(poly16_t  *a, poly16x4x3_t b) {
  // CHECK-LABEL: test_vld3_lane_p16
  return vld3_lane_p16(a, b, 3);
  // CHECK: ld3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld3_lane_p64 with lane 0 is expected to emit `ld3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
poly64x1x3_t test_vld3_lane_p64(poly64_t  *a, poly64x1x3_t b) {
  // CHECK-LABEL: test_vld3_lane_p64
  return vld3_lane_p64(a, b, 0);
  // CHECK: ld3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_u8 with lane 15 is expected to emit `ld4` on four
// `.b` registers at lane [15], with the address in an x register or sp.
uint8x16x4_t test_vld4q_lane_u8(uint8_t  *a, uint8x16x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_u8
  return vld4q_lane_u8(a, b, 15);
  // CHECK: ld4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_u16 with lane 7 is expected to emit `ld4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
uint16x8x4_t test_vld4q_lane_u16(uint16_t  *a, uint16x8x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_u16
  return vld4q_lane_u16(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_u32 with lane 3 is expected to emit `ld4` on four
// `.s` registers at lane [3], with the address in an x register or sp.
uint32x4x4_t test_vld4q_lane_u32(uint32_t  *a, uint32x4x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_u32
  return vld4q_lane_u32(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_u64 with lane 1 is expected to emit `ld4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
uint64x2x4_t test_vld4q_lane_u64(uint64_t  *a, uint64x2x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_u64
  return vld4q_lane_u64(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_s8 with lane 15 is expected to emit `ld4` on four
// `.b` registers at lane [15], with the address in an x register or sp.
int8x16x4_t test_vld4q_lane_s8(int8_t  *a, int8x16x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_s8
  return vld4q_lane_s8(a, b, 15);
  // CHECK: ld4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_s16 with lane 7 is expected to emit `ld4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
int16x8x4_t test_vld4q_lane_s16(int16_t  *a, int16x8x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_s16
  return vld4q_lane_s16(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_s32 with lane 3 is expected to emit `ld4` on four
// `.s` registers at lane [3], with the address in an x register or sp.
int32x4x4_t test_vld4q_lane_s32(int32_t  *a, int32x4x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_s32
  return vld4q_lane_s32(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_s64 with lane 1 is expected to emit `ld4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
int64x2x4_t test_vld4q_lane_s64(int64_t  *a, int64x2x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_s64
  return vld4q_lane_s64(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_f16 with lane 7 is expected to emit `ld4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
float16x8x4_t test_vld4q_lane_f16(float16_t  *a, float16x8x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_f16
  return vld4q_lane_f16(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_f32 with lane 3 is expected to emit `ld4` on four
// `.s` registers at lane [3], with the address in an x register or sp.
float32x4x4_t test_vld4q_lane_f32(float32_t  *a, float32x4x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_f32
  return vld4q_lane_f32(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_f64 with lane 1 is expected to emit `ld4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
float64x2x4_t test_vld4q_lane_f64(float64_t  *a, float64x2x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_f64
  return vld4q_lane_f64(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_p8 with lane 15 is expected to emit `ld4` on four
// `.b` registers at lane [15], with the address in an x register or sp.
poly8x16x4_t test_vld4q_lane_p8(poly8_t  *a, poly8x16x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_p8
  return vld4q_lane_p8(a, b, 15);
  // CHECK: ld4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_p16 with lane 7 is expected to emit `ld4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
poly16x8x4_t test_vld4q_lane_p16(poly16_t  *a, poly16x8x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_p16
  return vld4q_lane_p16(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4q_lane_p64 with lane 1 is expected to emit `ld4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
poly64x2x4_t test_vld4q_lane_p64(poly64_t  *a, poly64x2x4_t b) {
  // CHECK-LABEL: test_vld4q_lane_p64
  return vld4q_lane_p64(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_u8 with lane 7 is expected to emit `ld4` on four
// `.b` registers at lane [7], with the address in an x register or sp.
uint8x8x4_t test_vld4_lane_u8(uint8_t  *a, uint8x8x4_t b) {
  // CHECK-LABEL: test_vld4_lane_u8
  return vld4_lane_u8(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_u16 with lane 3 is expected to emit `ld4` on four
// `.h` registers at lane [3], with the address in an x register or sp.
uint16x4x4_t test_vld4_lane_u16(uint16_t  *a, uint16x4x4_t b) {
  // CHECK-LABEL: test_vld4_lane_u16
  return vld4_lane_u16(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_u32 with lane 1 is expected to emit `ld4` on four
// `.s` registers at lane [1], with the address in an x register or sp.
uint32x2x4_t test_vld4_lane_u32(uint32_t  *a, uint32x2x4_t b) {
  // CHECK-LABEL: test_vld4_lane_u32
  return vld4_lane_u32(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_u64 with lane 0 is expected to emit `ld4` on four
// `.d` registers at lane [0], with the address in an x register or sp.
uint64x1x4_t test_vld4_lane_u64(uint64_t  *a, uint64x1x4_t b) {
  // CHECK-LABEL: test_vld4_lane_u64
  return vld4_lane_u64(a, b, 0);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_s8 with lane 7 is expected to emit `ld4` on four
// `.b` registers at lane [7], with the address in an x register or sp.
int8x8x4_t test_vld4_lane_s8(int8_t  *a, int8x8x4_t b) {
  // CHECK-LABEL: test_vld4_lane_s8
  return vld4_lane_s8(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_s16 with lane 3 is expected to emit `ld4` on four
// `.h` registers at lane [3], with the address in an x register or sp.
int16x4x4_t test_vld4_lane_s16(int16_t  *a, int16x4x4_t b) {
  // CHECK-LABEL: test_vld4_lane_s16
  return vld4_lane_s16(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_s32 with lane 1 is expected to emit `ld4` on four
// `.s` registers at lane [1], with the address in an x register or sp.
int32x2x4_t test_vld4_lane_s32(int32_t  *a, int32x2x4_t b) {
  // CHECK-LABEL: test_vld4_lane_s32
  return vld4_lane_s32(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_s64 with lane 0 is expected to emit `ld4` on four
// `.d` registers at lane [0], with the address in an x register or sp.
int64x1x4_t test_vld4_lane_s64(int64_t  *a, int64x1x4_t b) {
  // CHECK-LABEL: test_vld4_lane_s64
  return vld4_lane_s64(a, b, 0);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_f16 with lane 3 is expected to emit `ld4` on four
// `.h` registers at lane [3], with the address in an x register or sp.
float16x4x4_t test_vld4_lane_f16(float16_t  *a, float16x4x4_t b) {
  // CHECK-LABEL: test_vld4_lane_f16
  return vld4_lane_f16(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_f32 with lane 1 is expected to emit `ld4` on four
// `.s` registers at lane [1], with the address in an x register or sp.
float32x2x4_t test_vld4_lane_f32(float32_t  *a, float32x2x4_t b) {
  // CHECK-LABEL: test_vld4_lane_f32
  return vld4_lane_f32(a, b, 1);
  // CHECK: ld4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_f64 with lane 0 is expected to emit `ld4` on four
// `.d` registers at lane [0], with the address in an x register or sp.
float64x1x4_t test_vld4_lane_f64(float64_t  *a, float64x1x4_t b) {
  // CHECK-LABEL: test_vld4_lane_f64
  return vld4_lane_f64(a, b, 0);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_p8 with lane 7 is expected to emit `ld4` on four
// `.b` registers at lane [7], with the address in an x register or sp.
poly8x8x4_t test_vld4_lane_p8(poly8_t  *a, poly8x8x4_t b) {
  // CHECK-LABEL: test_vld4_lane_p8
  return vld4_lane_p8(a, b, 7);
  // CHECK: ld4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_p16 with lane 3 is expected to emit `ld4` on four
// `.h` registers at lane [3], with the address in an x register or sp.
poly16x4x4_t test_vld4_lane_p16(poly16_t  *a, poly16x4x4_t b) {
  // CHECK-LABEL: test_vld4_lane_p16
  return vld4_lane_p16(a, b, 3);
  // CHECK: ld4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vld4_lane_p64 with lane 0 is expected to emit `ld4` on four
// `.d` registers at lane [0], with the address in an x register or sp.
poly64x1x4_t test_vld4_lane_p64(poly64_t  *a, poly64x1x4_t b) {
  // CHECK-LABEL: test_vld4_lane_p64
  return vld4_lane_p64(a, b, 0);
  // CHECK: ld4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_u8 with lane 15 is expected to emit `st1` on one
// `.b` register at lane [15], with the address in an x register or sp.
void test_vst1q_lane_u8(uint8_t  *a, uint8x16_t b) {
  // CHECK-LABEL: test_vst1q_lane_u8
  vst1q_lane_u8(a, b, 15);
  // CHECK: st1 {{{ *v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_u16 with lane 7 is expected to emit `st1` on one
// `.h` register at lane [7], with the address in an x register or sp.
void test_vst1q_lane_u16(uint16_t  *a, uint16x8_t b) {
  // CHECK-LABEL: test_vst1q_lane_u16
  vst1q_lane_u16(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_u32 with lane 3 is expected to emit `st1` on one
// `.s` register at lane [3], with the address in an x register or sp.
void test_vst1q_lane_u32(uint32_t  *a, uint32x4_t b) {
  // CHECK-LABEL: test_vst1q_lane_u32
  vst1q_lane_u32(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_u64 with lane 1 is expected to emit `st1` on one
// `.d` register at lane [1], with the address in an x register or sp.
void test_vst1q_lane_u64(uint64_t  *a, uint64x2_t b) {
  // CHECK-LABEL: test_vst1q_lane_u64
  vst1q_lane_u64(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_s8 with lane 15 is expected to emit `st1` on one
// `.b` register at lane [15], with the address in an x register or sp.
void test_vst1q_lane_s8(int8_t  *a, int8x16_t b) {
  // CHECK-LABEL: test_vst1q_lane_s8
  vst1q_lane_s8(a, b, 15);
  // CHECK: st1 {{{ *v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_s16 with lane 7 is expected to emit `st1` on one
// `.h` register at lane [7], with the address in an x register or sp.
void test_vst1q_lane_s16(int16_t  *a, int16x8_t b) {
  // CHECK-LABEL: test_vst1q_lane_s16
  vst1q_lane_s16(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_s32 with lane 3 is expected to emit `st1` on one
// `.s` register at lane [3], with the address in an x register or sp.
void test_vst1q_lane_s32(int32_t  *a, int32x4_t b) {
  // CHECK-LABEL: test_vst1q_lane_s32
  vst1q_lane_s32(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_s64 with lane 1 is expected to emit `st1` on one
// `.d` register at lane [1], with the address in an x register or sp.
void test_vst1q_lane_s64(int64_t  *a, int64x2_t b) {
  // CHECK-LABEL: test_vst1q_lane_s64
  vst1q_lane_s64(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_f16 with lane 7 is expected to emit `st1` on one
// `.h` register at lane [7], with the address in an x register or sp.
void test_vst1q_lane_f16(float16_t  *a, float16x8_t b) {
  // CHECK-LABEL: test_vst1q_lane_f16
  vst1q_lane_f16(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_f32 with lane 3 is expected to emit `st1` on one
// `.s` register at lane [3], with the address in an x register or sp.
void test_vst1q_lane_f32(float32_t  *a, float32x4_t b) {
  // CHECK-LABEL: test_vst1q_lane_f32
  vst1q_lane_f32(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_f64 with lane 1 is expected to emit `st1` on one
// `.d` register at lane [1], with the address in an x register or sp.
void test_vst1q_lane_f64(float64_t  *a, float64x2_t b) {
  // CHECK-LABEL: test_vst1q_lane_f64
  vst1q_lane_f64(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_p8 with lane 15 is expected to emit `st1` on one
// `.b` register at lane [15], with the address in an x register or sp.
void test_vst1q_lane_p8(poly8_t  *a, poly8x16_t b) {
  // CHECK-LABEL: test_vst1q_lane_p8
  vst1q_lane_p8(a, b, 15);
  // CHECK: st1 {{{ *v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_p16 with lane 7 is expected to emit `st1` on one
// `.h` register at lane [7], with the address in an x register or sp.
void test_vst1q_lane_p16(poly16_t  *a, poly16x8_t b) {
  // CHECK-LABEL: test_vst1q_lane_p16
  vst1q_lane_p16(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1q_lane_p64 with lane 1 is expected to emit `st1` on one
// `.d` register at lane [1], with the address in an x register or sp.
void test_vst1q_lane_p64(poly64_t  *a, poly64x2_t b) {
  // CHECK-LABEL: test_vst1q_lane_p64
  vst1q_lane_p64(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_u8 with lane 7 is expected to emit `st1` on one
// `.b` register at lane [7], with the address in an x register or sp.
void test_vst1_lane_u8(uint8_t  *a, uint8x8_t b) {
  // CHECK-LABEL: test_vst1_lane_u8
  vst1_lane_u8(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_u16 with lane 3 is expected to emit `st1` on one
// `.h` register at lane [3], with the address in an x register or sp.
void test_vst1_lane_u16(uint16_t  *a, uint16x4_t b) {
  // CHECK-LABEL: test_vst1_lane_u16
  vst1_lane_u16(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_u32 with lane 1 is expected to emit `st1` on one
// `.s` register at lane [1], with the address in an x register or sp.
void test_vst1_lane_u32(uint32_t  *a, uint32x2_t b) {
  // CHECK-LABEL: test_vst1_lane_u32
  vst1_lane_u32(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_u64 with lane 0 is expected to emit `st1` on one
// `.d` register at lane [0], with the address in an x register or sp.
void test_vst1_lane_u64(uint64_t  *a, uint64x1_t b) {
  // CHECK-LABEL: test_vst1_lane_u64
  vst1_lane_u64(a, b, 0);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_s8 with lane 7 is expected to emit `st1` on one
// `.b` register at lane [7], with the address in an x register or sp.
void test_vst1_lane_s8(int8_t  *a, int8x8_t b) {
  // CHECK-LABEL: test_vst1_lane_s8
  vst1_lane_s8(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_s16 with lane 3 is expected to emit `st1` on one
// `.h` register at lane [3], with the address in an x register or sp.
void test_vst1_lane_s16(int16_t  *a, int16x4_t b) {
  // CHECK-LABEL: test_vst1_lane_s16
  vst1_lane_s16(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_s32 with lane 1 is expected to emit `st1` on one
// `.s` register at lane [1], with the address in an x register or sp.
void test_vst1_lane_s32(int32_t  *a, int32x2_t b) {
  // CHECK-LABEL: test_vst1_lane_s32
  vst1_lane_s32(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_s64 with lane 0 is expected to emit `st1` on one
// `.d` register at lane [0], with the address in an x register or sp.
void test_vst1_lane_s64(int64_t  *a, int64x1_t b) {
  // CHECK-LABEL: test_vst1_lane_s64
  vst1_lane_s64(a, b, 0);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_f16 with lane 3 is expected to emit `st1` on one
// `.h` register at lane [3], with the address in an x register or sp.
void test_vst1_lane_f16(float16_t  *a, float16x4_t b) {
  // CHECK-LABEL: test_vst1_lane_f16
  vst1_lane_f16(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_f32 with lane 1 is expected to emit `st1` on one
// `.s` register at lane [1], with the address in an x register or sp.
void test_vst1_lane_f32(float32_t  *a, float32x2_t b) {
  // CHECK-LABEL: test_vst1_lane_f32
  vst1_lane_f32(a, b, 1);
  // CHECK: st1 {{{ *v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_f64 with lane 0. Unlike the sibling st1 tests, the
// pattern here accepts either `st1 { vN.d }[0]` or a plain `str dN`, with the
// address in an x register or sp.
void test_vst1_lane_f64(float64_t  *a, float64x1_t b) {
  // CHECK-LABEL: test_vst1_lane_f64
  vst1_lane_f64(a, b, 0);
  // CHECK: {{st1 { v[0-9]+.d }\[0]|str d[0-9]+}}, [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_p8 with lane 7 is expected to emit `st1` on one
// `.b` register at lane [7], with the address in an x register or sp.
void test_vst1_lane_p8(poly8_t  *a, poly8x8_t b) {
  // CHECK-LABEL: test_vst1_lane_p8
  vst1_lane_p8(a, b, 7);
  // CHECK: st1 {{{ *v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_p16 with lane 3 is expected to emit `st1` on one
// `.h` register at lane [3], with the address in an x register or sp.
void test_vst1_lane_p16(poly16_t  *a, poly16x4_t b) {
  // CHECK-LABEL: test_vst1_lane_p16
  vst1_lane_p16(a, b, 3);
  // CHECK: st1 {{{ *v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst1_lane_p64 with lane 0 is expected to emit `st1` on one
// `.d` register at lane [0], with the address in an x register or sp.
void test_vst1_lane_p64(poly64_t  *a, poly64x1_t b) {
  // CHECK-LABEL: test_vst1_lane_p64
  vst1_lane_p64(a, b, 0);
  // CHECK: st1 {{{ *v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_u8 with lane 15 is expected to emit `st2` on two
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst2q_lane_u8(uint8_t  *a, uint8x16x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_u8
  vst2q_lane_u8(a, b, 15);
  // CHECK: st2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_u16 with lane 7 is expected to emit `st2` on two
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst2q_lane_u16(uint16_t  *a, uint16x8x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_u16
  vst2q_lane_u16(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_u32 with lane 3 is expected to emit `st2` on two
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst2q_lane_u32(uint32_t  *a, uint32x4x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_u32
  vst2q_lane_u32(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_u64 with lane 1 is expected to emit `st2` on two
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst2q_lane_u64(uint64_t  *a, uint64x2x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_u64
  vst2q_lane_u64(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_s8 with lane 15 is expected to emit `st2` on two
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst2q_lane_s8(int8_t  *a, int8x16x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_s8
  vst2q_lane_s8(a, b, 15);
  // CHECK: st2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_s16 with lane 7 is expected to emit `st2` on two
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst2q_lane_s16(int16_t  *a, int16x8x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_s16
  vst2q_lane_s16(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_s32 with lane 3 is expected to emit `st2` on two
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst2q_lane_s32(int32_t  *a, int32x4x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_s32
  vst2q_lane_s32(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_s64 with lane 1 is expected to emit `st2` on two
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst2q_lane_s64(int64_t  *a, int64x2x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_s64
  vst2q_lane_s64(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_f16 with lane 7 is expected to emit `st2` on two
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst2q_lane_f16(float16_t  *a, float16x8x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_f16
  vst2q_lane_f16(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_f32 with lane 3 is expected to emit `st2` on two
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst2q_lane_f32(float32_t  *a, float32x4x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_f32
  vst2q_lane_f32(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_f64 with lane 1 is expected to emit `st2` on two
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst2q_lane_f64(float64_t  *a, float64x2x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_f64
  vst2q_lane_f64(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_p8 with lane 15 is expected to emit `st2` on two
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst2q_lane_p8(poly8_t  *a, poly8x16x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_p8
  vst2q_lane_p8(a, b, 15);
  // CHECK: st2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_p16 with lane 7 is expected to emit `st2` on two
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst2q_lane_p16(poly16_t  *a, poly16x8x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_p16
  vst2q_lane_p16(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2q_lane_p64 with lane 1 is expected to emit `st2` on two
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst2q_lane_p64(poly64_t  *a, poly64x2x2_t b) {
  // CHECK-LABEL: test_vst2q_lane_p64
  vst2q_lane_p64(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_u8 with lane 7 is expected to emit `st2` on two
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst2_lane_u8(uint8_t  *a, uint8x8x2_t b) {
  // CHECK-LABEL: test_vst2_lane_u8
  vst2_lane_u8(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_u16 with lane 3 is expected to emit `st2` on two
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst2_lane_u16(uint16_t  *a, uint16x4x2_t b) {
  // CHECK-LABEL: test_vst2_lane_u16
  vst2_lane_u16(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_u32 with lane 1 is expected to emit `st2` on two
// `.s` registers at lane [1], with the address in an x register or sp.
void test_vst2_lane_u32(uint32_t  *a, uint32x2x2_t b) {
  // CHECK-LABEL: test_vst2_lane_u32
  vst2_lane_u32(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_u64 with lane 0 is expected to emit `st2` on two
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst2_lane_u64(uint64_t  *a, uint64x1x2_t b) {
  // CHECK-LABEL: test_vst2_lane_u64
  vst2_lane_u64(a, b, 0);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_s8 with lane 7 is expected to emit `st2` on two
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst2_lane_s8(int8_t  *a, int8x8x2_t b) {
  // CHECK-LABEL: test_vst2_lane_s8
  vst2_lane_s8(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_s16 with lane 3 is expected to emit `st2` on two
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst2_lane_s16(int16_t  *a, int16x4x2_t b) {
  // CHECK-LABEL: test_vst2_lane_s16
  vst2_lane_s16(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_s32 with lane 1 is expected to emit `st2` on two
// `.s` registers at lane [1], with the address in an x register or sp.
void test_vst2_lane_s32(int32_t  *a, int32x2x2_t b) {
  // CHECK-LABEL: test_vst2_lane_s32
  vst2_lane_s32(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_s64 with lane 0 is expected to emit `st2` on two
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst2_lane_s64(int64_t  *a, int64x1x2_t b) {
  // CHECK-LABEL: test_vst2_lane_s64
  vst2_lane_s64(a, b, 0);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_f16 with lane 3 is expected to emit `st2` on two
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst2_lane_f16(float16_t  *a, float16x4x2_t b) {
  // CHECK-LABEL: test_vst2_lane_f16
  vst2_lane_f16(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_f32 with lane 1 is expected to emit `st2` on two
// `.s` registers at lane [1], with the address in an x register or sp.
void test_vst2_lane_f32(float32_t  *a, float32x2x2_t b) {
  // CHECK-LABEL: test_vst2_lane_f32
  vst2_lane_f32(a, b, 1);
  // CHECK: st2 {{{ *v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_f64 with lane 0 is expected to emit `st2` on two
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst2_lane_f64(float64_t  *a, float64x1x2_t b) {
  // CHECK-LABEL: test_vst2_lane_f64
  vst2_lane_f64(a, b, 0);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_p8 with lane 7 is expected to emit `st2` on two
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst2_lane_p8(poly8_t  *a, poly8x8x2_t b) {
  // CHECK-LABEL: test_vst2_lane_p8
  vst2_lane_p8(a, b, 7);
  // CHECK: st2 {{{ *v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_p16 with lane 3 is expected to emit `st2` on two
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst2_lane_p16(poly16_t  *a, poly16x4x2_t b) {
  // CHECK-LABEL: test_vst2_lane_p16
  vst2_lane_p16(a, b, 3);
  // CHECK: st2 {{{ *v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst2_lane_p64 with lane 0 is expected to emit `st2` on two
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst2_lane_p64(poly64_t  *a, poly64x1x2_t b) {
  // CHECK-LABEL: test_vst2_lane_p64
  vst2_lane_p64(a, b, 0);
  // CHECK: st2 {{{ *v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_u8 with lane 15 is expected to emit `st3` on three
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst3q_lane_u8(uint8_t  *a, uint8x16x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_u8
  vst3q_lane_u8(a, b, 15);
  // CHECK: st3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_u16 with lane 7 is expected to emit `st3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst3q_lane_u16(uint16_t  *a, uint16x8x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_u16
  vst3q_lane_u16(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_u32 with lane 3 is expected to emit `st3` on three
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst3q_lane_u32(uint32_t  *a, uint32x4x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_u32
  vst3q_lane_u32(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_u64 with lane 1 is expected to emit `st3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst3q_lane_u64(uint64_t  *a, uint64x2x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_u64
  vst3q_lane_u64(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_s8 with lane 15 is expected to emit `st3` on three
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst3q_lane_s8(int8_t  *a, int8x16x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_s8
  vst3q_lane_s8(a, b, 15);
  // CHECK: st3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_s16 with lane 7 is expected to emit `st3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst3q_lane_s16(int16_t  *a, int16x8x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_s16
  vst3q_lane_s16(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_s32 with lane 3 is expected to emit `st3` on three
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst3q_lane_s32(int32_t  *a, int32x4x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_s32
  vst3q_lane_s32(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_s64 with lane 1 is expected to emit `st3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst3q_lane_s64(int64_t  *a, int64x2x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_s64
  vst3q_lane_s64(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_f16 with lane 7 is expected to emit `st3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst3q_lane_f16(float16_t  *a, float16x8x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_f16
  vst3q_lane_f16(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_f32 with lane 3 is expected to emit `st3` on three
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst3q_lane_f32(float32_t  *a, float32x4x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_f32
  vst3q_lane_f32(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_f64 with lane 1 is expected to emit `st3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst3q_lane_f64(float64_t  *a, float64x2x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_f64
  vst3q_lane_f64(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_p8 with lane 15 is expected to emit `st3` on three
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst3q_lane_p8(poly8_t  *a, poly8x16x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_p8
  vst3q_lane_p8(a, b, 15);
  // CHECK: st3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_p16 with lane 7 is expected to emit `st3` on three
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst3q_lane_p16(poly16_t  *a, poly16x8x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_p16
  vst3q_lane_p16(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3q_lane_p64 with lane 1 is expected to emit `st3` on three
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst3q_lane_p64(poly64_t  *a, poly64x2x3_t b) {
  // CHECK-LABEL: test_vst3q_lane_p64
  vst3q_lane_p64(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_u8 with lane 7 is expected to emit `st3` on three
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst3_lane_u8(uint8_t  *a, uint8x8x3_t b) {
  // CHECK-LABEL: test_vst3_lane_u8
  vst3_lane_u8(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_u16 with lane 3 is expected to emit `st3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst3_lane_u16(uint16_t  *a, uint16x4x3_t b) {
  // CHECK-LABEL: test_vst3_lane_u16
  vst3_lane_u16(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_u32 with lane 1 is expected to emit `st3` on three
// `.s` registers at lane [1], with the address in an x register or sp.
void test_vst3_lane_u32(uint32_t  *a, uint32x2x3_t b) {
  // CHECK-LABEL: test_vst3_lane_u32
  vst3_lane_u32(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_u64 with lane 0 is expected to emit `st3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst3_lane_u64(uint64_t  *a, uint64x1x3_t b) {
  // CHECK-LABEL: test_vst3_lane_u64
  vst3_lane_u64(a, b, 0);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_s8 with lane 7 is expected to emit `st3` on three
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst3_lane_s8(int8_t  *a, int8x8x3_t b) {
  // CHECK-LABEL: test_vst3_lane_s8
  vst3_lane_s8(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_s16 with lane 3 is expected to emit `st3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst3_lane_s16(int16_t  *a, int16x4x3_t b) {
  // CHECK-LABEL: test_vst3_lane_s16
  vst3_lane_s16(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_s32 with lane 1 is expected to emit `st3` on three
// `.s` registers at lane [1], with the address in an x register or sp.
void test_vst3_lane_s32(int32_t  *a, int32x2x3_t b) {
  // CHECK-LABEL: test_vst3_lane_s32
  vst3_lane_s32(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_s64 with lane 0 is expected to emit `st3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst3_lane_s64(int64_t  *a, int64x1x3_t b) {
  // CHECK-LABEL: test_vst3_lane_s64
  vst3_lane_s64(a, b, 0);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_f16 with lane 3 is expected to emit `st3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst3_lane_f16(float16_t  *a, float16x4x3_t b) {
  // CHECK-LABEL: test_vst3_lane_f16
  vst3_lane_f16(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_f32 with lane 1 is expected to emit `st3` on three
// `.s` registers at lane [1], with the address in an x register or sp.
void test_vst3_lane_f32(float32_t  *a, float32x2x3_t b) {
  // CHECK-LABEL: test_vst3_lane_f32
  vst3_lane_f32(a, b, 1);
  // CHECK: st3 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_f64 with lane 0 is expected to emit `st3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst3_lane_f64(float64_t  *a, float64x1x3_t b) {
  // CHECK-LABEL: test_vst3_lane_f64
  vst3_lane_f64(a, b, 0);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_p8 with lane 7 is expected to emit `st3` on three
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst3_lane_p8(poly8_t  *a, poly8x8x3_t b) {
  // CHECK-LABEL: test_vst3_lane_p8
  vst3_lane_p8(a, b, 7);
  // CHECK: st3 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_p16 with lane 3 is expected to emit `st3` on three
// `.h` registers at lane [3], with the address in an x register or sp.
void test_vst3_lane_p16(poly16_t  *a, poly16x4x3_t b) {
  // CHECK-LABEL: test_vst3_lane_p16
  vst3_lane_p16(a, b, 3);
  // CHECK: st3 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst3_lane_p64 with lane 0 is expected to emit `st3` on three
// `.d` registers at lane [0], with the address in an x register or sp.
void test_vst3_lane_p64(poly64_t  *a, poly64x1x3_t b) {
  // CHECK-LABEL: test_vst3_lane_p64
  vst3_lane_p64(a, b, 0);
  // CHECK: st3 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_u8 with lane 15 is expected to emit `st4` on four
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst4q_lane_u8(uint8_t  *a, uint8x16x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_u8
  vst4q_lane_u8(a, b, 15);
  // CHECK: st4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_u16 with lane 7 is expected to emit `st4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst4q_lane_u16(uint16_t  *a, uint16x8x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_u16
  vst4q_lane_u16(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_u32 with lane 3 is expected to emit `st4` on four
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst4q_lane_u32(uint32_t  *a, uint32x4x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_u32
  vst4q_lane_u32(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_u64 with lane 1 is expected to emit `st4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst4q_lane_u64(uint64_t  *a, uint64x2x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_u64
  vst4q_lane_u64(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_s8 with lane 15 is expected to emit `st4` on four
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst4q_lane_s8(int8_t  *a, int8x16x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_s8
  vst4q_lane_s8(a, b, 15);
  // CHECK: st4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_s16 with lane 7 is expected to emit `st4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst4q_lane_s16(int16_t  *a, int16x8x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_s16
  vst4q_lane_s16(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_s32 with lane 3 is expected to emit `st4` on four
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst4q_lane_s32(int32_t  *a, int32x4x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_s32
  vst4q_lane_s32(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_s64 with lane 1 is expected to emit `st4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst4q_lane_s64(int64_t  *a, int64x2x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_s64
  vst4q_lane_s64(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_f16 with lane 7 is expected to emit `st4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst4q_lane_f16(float16_t  *a, float16x8x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_f16
  vst4q_lane_f16(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_f32 with lane 3 is expected to emit `st4` on four
// `.s` registers at lane [3], with the address in an x register or sp.
void test_vst4q_lane_f32(float32_t  *a, float32x4x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_f32
  vst4q_lane_f32(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_f64 with lane 1 is expected to emit `st4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst4q_lane_f64(float64_t  *a, float64x2x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_f64
  vst4q_lane_f64(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_p8 with lane 15 is expected to emit `st4` on four
// `.b` registers at lane [15], with the address in an x register or sp.
void test_vst4q_lane_p8(poly8_t  *a, poly8x16x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_p8
  vst4q_lane_p8(a, b, 15);
  // CHECK: st4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[15], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_p16 with lane 7 is expected to emit `st4` on four
// `.h` registers at lane [7], with the address in an x register or sp.
void test_vst4q_lane_p16(poly16_t  *a, poly16x8x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_p16
  vst4q_lane_p16(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4q_lane_p64 with lane 1 is expected to emit `st4` on four
// `.d` registers at lane [1], with the address in an x register or sp.
void test_vst4q_lane_p64(poly64_t  *a, poly64x2x4_t b) {
  // CHECK-LABEL: test_vst4q_lane_p64
  vst4q_lane_p64(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test: vst4_lane_u8 with lane 7 is expected to emit `st4` on four
// `.b` registers at lane [7], with the address in an x register or sp.
void test_vst4_lane_u8(uint8_t  *a, uint8x8x4_t b) {
  // CHECK-LABEL: test_vst4_lane_u8
  vst4_lane_u8(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_u16 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 3.
// Expected assembly: one single-lane `st4` over four `.h` vector registers,
// indexed [3], with the base address held in an x-register or sp.
void test_vst4_lane_u16(uint16_t  *a, uint16x4x4_t b) {
  // CHECK-LABEL: test_vst4_lane_u16
  vst4_lane_u16(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_u32 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 1.
// Expected assembly: one single-lane `st4` over four `.s` vector registers,
// indexed [1], with the base address held in an x-register or sp.
void test_vst4_lane_u32(uint32_t  *a, uint32x2x4_t b) {
  // CHECK-LABEL: test_vst4_lane_u32
  vst4_lane_u32(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_u64 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 0.
// Expected assembly: one single-lane `st4` over four `.d` vector registers,
// indexed [0], with the base address held in an x-register or sp.
void test_vst4_lane_u64(uint64_t  *a, uint64x1x4_t b) {
  // CHECK-LABEL: test_vst4_lane_u64
  vst4_lane_u64(a, b, 0);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_s8 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 7.
// Expected assembly: one single-lane `st4` over four `.b` vector registers,
// indexed [7], with the base address held in an x-register or sp.
void test_vst4_lane_s8(int8_t  *a, int8x8x4_t b) {
  // CHECK-LABEL: test_vst4_lane_s8
  vst4_lane_s8(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_s16 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 3.
// Expected assembly: one single-lane `st4` over four `.h` vector registers,
// indexed [3], with the base address held in an x-register or sp.
void test_vst4_lane_s16(int16_t  *a, int16x4x4_t b) {
  // CHECK-LABEL: test_vst4_lane_s16
  vst4_lane_s16(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_s32 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 1.
// Expected assembly: one single-lane `st4` over four `.s` vector registers,
// indexed [1], with the base address held in an x-register or sp.
void test_vst4_lane_s32(int32_t  *a, int32x2x4_t b) {
  // CHECK-LABEL: test_vst4_lane_s32
  vst4_lane_s32(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_s64 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 0.
// Expected assembly: one single-lane `st4` over four `.d` vector registers,
// indexed [0], with the base address held in an x-register or sp.
void test_vst4_lane_s64(int64_t  *a, int64x1x4_t b) {
  // CHECK-LABEL: test_vst4_lane_s64
  vst4_lane_s64(a, b, 0);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_f16 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 3.
// Expected assembly: one single-lane `st4` over four `.h` vector registers,
// indexed [3], with the base address held in an x-register or sp.
void test_vst4_lane_f16(float16_t  *a, float16x4x4_t b) {
  // CHECK-LABEL: test_vst4_lane_f16
  vst4_lane_f16(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_f32 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 1.
// Expected assembly: one single-lane `st4` over four `.s` vector registers,
// indexed [1], with the base address held in an x-register or sp.
void test_vst4_lane_f32(float32_t  *a, float32x2x4_t b) {
  // CHECK-LABEL: test_vst4_lane_f32
  vst4_lane_f32(a, b, 1);
  // CHECK: st4 {{{ *v[0-9]+.s, v[0-9]+.s, v[0-9]+.s, v[0-9]+.s *}}}[1], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_f64 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 0.
// Expected assembly: one single-lane `st4` over four `.d` vector registers,
// indexed [0], with the base address held in an x-register or sp.
void test_vst4_lane_f64(float64_t  *a, float64x1x4_t b) {
  // CHECK-LABEL: test_vst4_lane_f64
  vst4_lane_f64(a, b, 0);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_p8 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 7.
// Expected assembly: one single-lane `st4` over four `.b` vector registers,
// indexed [7], with the base address held in an x-register or sp.
void test_vst4_lane_p8(poly8_t  *a, poly8x8x4_t b) {
  // CHECK-LABEL: test_vst4_lane_p8
  vst4_lane_p8(a, b, 7);
  // CHECK: st4 {{{ *v[0-9]+.b, v[0-9]+.b, v[0-9]+.b, v[0-9]+.b *}}}[7], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_p16 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 3.
// Expected assembly: one single-lane `st4` over four `.h` vector registers,
// indexed [3], with the base address held in an x-register or sp.
void test_vst4_lane_p16(poly16_t  *a, poly16x4x4_t b) {
  // CHECK-LABEL: test_vst4_lane_p16
  vst4_lane_p16(a, b, 3);
  // CHECK: st4 {{{ *v[0-9]+.h, v[0-9]+.h, v[0-9]+.h, v[0-9]+.h *}}}[3], [{{x[0-9]+|sp}}]
}

// Codegen test for vst4_lane_p64 (non-q form) called with pointer `a`, vector
// tuple `b` and the literal lane index 0.
// Expected assembly: one single-lane `st4` over four `.d` vector registers,
// indexed [0], with the base address held in an x-register or sp.
void test_vst4_lane_p64(poly64_t  *a, poly64x1x4_t b) {
  // CHECK-LABEL: test_vst4_lane_p64
  vst4_lane_p64(a, b, 0);
  // CHECK: st4 {{{ *v[0-9]+.d, v[0-9]+.d, v[0-9]+.d, v[0-9]+.d *}}}[0], [{{x[0-9]+|sp}}]
}