/*
gcc -g -o v8memory_a -march=armv8-a -mfpu=crypto-neon-fp-armv8 \
none/tests/arm/v8memory.c -I. -Wall -marm
gcc -g -o v8memory_t -march=armv8-a -mfpu=crypto-neon-fp-armv8 \
none/tests/arm/v8memory.c -I. -Wall -mthumb
*/
/* These tests unfortunately are unable to check the relative
placement (or, even, presence) of the required memory fences
relative to the store/load required. They only verify the
data-movement component. */
#include <stdio.h>
#include <malloc.h> // memalign
#include <string.h> // memset
#include "tests/malloc.h"
#include <assert.h>
typedef unsigned char UChar;
typedef unsigned short int UShort;
typedef unsigned int UInt;
typedef signed int Int;
typedef unsigned char UChar;
typedef signed long long int Long;
typedef unsigned long long int ULong;
typedef unsigned char Bool;
#define False ((Bool)0)
#define True ((Bool)1)
static inline UChar randUChar ( void )
{
static UInt seed = 90210; // Somewhere in Beverly Hills, allegedly.
seed = 1103515245 * seed + 12345;
return (seed >> 17) & 0xFF;
}
static UInt randUInt ( void )
{
Int i;
UInt r = 0;
for (i = 0; i < 4; i++) {
r = (r << 8) | (UInt)(0xFF & randUChar());
}
return r;
}
static void show_block_xor ( UChar* block1, UChar* block2, Int n )
{
Int i;
printf(" ");
for (i = 0; i < n; i++) {
if (i > 0 && 0 == (i & 15)) printf("\n ");
if (0 == (i & 15)) printf("[%3d] ", i);
UInt diff = 0xFF & (UInt)(block1[i] - block2[i]);
if (diff == 0)
printf(".. ");
else
printf("%02x ", diff);
}
printf("\n");
}
// INSN may mention the following regs as containing load/store data:
// r2 r3 r6 r9
// INSN must mention the following reg as containing the EA: r10
//
// INSN can use r4 and r5 as scratch
//
// In: rand: memory area (128 bytes), r2, r3, r6, r9
// r10 pointing to middle of memory area
//
// Out: memory area, r2, r3, r6, r9, r10
//
// What is printed out: the XOR of the new and old versions of the
// following:
// the memory area
// r2, r3 r6 r9 r10
#define MEM_TEST(INSN) { \
int i; \
const int N = 128; \
UChar* area1 = memalign16(N); \
UChar* area2 = memalign16(N); \
for (i = 0; i < N; i++) area1[i] = area2[i] = randUChar(); \
UInt block1[5]; \
UInt block2[5]; \
/* 0:r2 1:r3 2:r6 3:r9 4:r10 */ \
for (i = 0; i < 5; i++) block1[i] = block2[i] = randUInt(); \
block1[4] = block2[4] = (UInt)(&area1[N/2]); \
__asm__ __volatile__( \
"ldr r2, [%0, #0] ; " \
"ldr r3, [%0, #4] ; " \
"ldr r6, [%0, #8] ; " \
"ldr r9, [%0, #12] ; " \
"ldr r10, [%0, #16] ; " \
INSN " ; " \
"str r2, [%0, #0] ; " \
"str r3, [%0, #4] ; " \
"str r6, [%0, #8] ; " \
"str r9, [%0, #12] ; " \
"str r10, [%0, #16] ; " \
: : "r"(&block1[0]) : "r2", "r3", "r4", "r5", "r6", "r9", "r10", \
"memory", "cc" \
); \
printf("%s with r10 = middle_of_block\n", INSN); \
show_block_xor(&area1[0], &area2[0], N); \
printf(" %08x r2 (xor, data intreg #1)\n", block1[0] ^ block2[0]); \
printf(" %08x r3 (xor, data intreg #2)\n", block1[1] ^ block2[1]); \
printf(" %08x r6 (xor, data intreg #3)\n", block1[2] ^ block2[2]); \
printf(" %08x r9 (xor, data intreg #4)\n", block1[3] ^ block2[3]); \
printf(" %08x r10 (xor, addr intreg #1)\n", block1[4] ^ block2[4]); \
printf("\n"); \
free(area1); free(area2); \
}
int main ( void )
{
////////////////////////////////////////////////////////////////
printf("LDA{,B,H} (reg)\n\n");
MEM_TEST("lda r6, [r10]")
MEM_TEST("ldab r9, [r10]")
MEM_TEST("ldah r3, [r10]")
////////////////////////////////////////////////////////////////
printf("STL{,B,H} (reg)\n\n");
MEM_TEST("stl r6, [r10]")
MEM_TEST("stlb r9, [r10]")
MEM_TEST("stlh r3, [r10]")
////////////////////////////////////////////////////////////////
printf("LDAEX{,B,H,D} (reg)\n\n");
MEM_TEST("ldaex r6, [r10]")
MEM_TEST("ldaexb r9, [r10]")
MEM_TEST("ldaexh r3, [r10]")
MEM_TEST("ldaexd r2, r3, [r10]")
////////////////////////////////////////////////////////////////
// These verify that stlex* do notice a cleared (missing) reservation.
printf("STLEX{,B,H,D} (reg) -- expected to fail\n\n");
MEM_TEST("clrex; stlex r9, r6, [r10]")
MEM_TEST("clrex; stlexb r9, r6, [r10]")
MEM_TEST("clrex; stlexh r9, r3, [r10]")
MEM_TEST("clrex; stlexd r9, r2, r3, [r10]")
////////////////////////////////////////////////////////////////
// These verify that stlex* do notice a successful reservation.
// By using ldaex* to create the reservation in the first place,
// they also verify that ldaex* actually create a reservation.
printf("STLEX{,B,H,D} (reg) -- expected to succeed\n\n");
MEM_TEST("ldaex r2, [r10] ; stlex r9, r6, [r10]")
MEM_TEST("ldaexb r2, [r10] ; stlexb r9, r6, [r10]")
MEM_TEST("ldaexh r2, [r10] ; stlexh r9, r3, [r10]")
MEM_TEST("mov r4, r2 ; mov r5, r3 ; " // preserve r2/r3 around the ldrexd
"ldaexd r2, r3, [r10] ; "
"mov r2, r4 ; mov r3, r5 ; "
"stlexd r9, r2, r3, [r10]")
return 0;
}