#include <stdint.h>
#include <inttypes.h>
#include <stdlib.h>
#include <string.h>
#include <stdio.h>
#include <assert.h>
#include "opcodes.h"
/* The abstracted result of a CU41 insn: the values of the two operand
   register pairs after the instruction has executed, plus the condition
   code it produced (filled in by do_cu41). */
typedef struct {
uint64_t addr1; // target (first operand) address after the insn
uint64_t len1; // target length after the insn
uint64_t addr2; // source (second operand) address after the insn
uint64_t len2; // source length after the insn
uint32_t cc; // condition code extracted after the insn
} cu41_t;
/* Define various input buffers. */
/* 0000 to 007f: Result is 1 byte for each uint32_t */
uint32_t pattern1[] = {
   /* corner cases */
   0x00000000, 0x0000007f,
   /* misc */
   0x00000001, 0x0000007e, 0x00000030, 0x0000005e
};
/* 0080 to 07ff: Result is 2 bytes for each uint32_t */
uint32_t pattern2[] = {
   /* corner cases */
   0x00000080, 0x000007ff,
   /* misc */
   0x00000081, 0x000007fe, 0x00000100, 0x00000333,
   0x00000555, 0x000006aa
};
/* 0800 to d7ff: Result is 3 bytes for each uint32_t */
/* dc00 to ffff: Result is 3 bytes for each uint32_t */
uint32_t pattern3[] = {
   /* corner cases of the 0800..d7ff range */
   0x00000800, 0x0000d7ff,
   /* corner cases of the dc00..ffff range */
   0x0000dc00, 0x0000ffff,
   /* misc */
   0x0000dc01, 0x0000fffe, 0x0000dea0, 0x0000d00d, 0x0000e555
};
/* 10000 to 10ffff: Result is 4 bytes for each uint32_t */
uint32_t pattern4[] = {
   /* corner cases */
   0x00010000, 0x0010ffff,
   /* misc */
   0x00010001, 0x0010fffe, 0x00012345, 0x00023456, 0x000fedcb
};
/* Invalid UTF-32 characters. Every value listed here lies either in
   d800..dbff or above 10ffff. */
uint32_t invalid[] = {
   /* corner cases: d800..dbff */
   0x0000d800,
   0x0000dbff,
   /* corner cases: above 10ffff */
   0x00110000,
   0xffffffff,
   /* misc: d800..dbff */
   0x0000daad,
   0x0000d901,
   0x0000d8ff,
   /* misc: above 10ffff */
   0x00110011,
   0x01000000,
   0x10000000,
   0xdeadbeef
};
/* Mixed input: one character for each UTF-8 result length (1 to 4 bytes) */
uint32_t mixed[] = {
   0x00000078,   /* 1 byte */
   0x00000111,   /* 2 bytes */
   0x00001234,   /* 3 bytes */
   0x00040404    /* 4 bytes */
};
/* This is the buffer for the converted bytes. It is shared by all tests
   and is refilled by write_and_check_aux before each of its runs. */
uint8_t buff[1000]; /* Large so we don't have to worry about it */
/* Forward declaration: main calls write_and_check before its definition.
   Arguments are (input, num_input_bytes, num_expected_output_bytes). */
void write_and_check(uint32_t *, unsigned, unsigned);
/* Execute a single CU41 instruction and return the resulting register state.

   dst/dst_len are placed in registers 2/3 and src/src_len in registers 4/5
   before the instruction is issued. After it completes, the (possibly
   updated) contents of those four registers and the condition code are
   copied into a cu41_t and returned by value.

   NOTE(review): the CU41 macro comes from opcodes.h, which is not visible
   here; presumably it emits the instruction with r1=2 and r2=4 -- confirm. */
static cu41_t
do_cu41(uint8_t *dst, uint64_t dst_len, uint32_t *src, uint64_t src_len)
{
/* cc is an output-only ("=d") operand of the asm below, so this initial
   value is never passed into the instruction sequence. */
int cc = 42;
cu41_t regs;
/* Build up the register pairs: r4/r5 hold the source address/length,
   r2/r3 hold the destination address/length. */
register uint32_t *source asm("4") = src;
register uint64_t source_len asm("5") = src_len;
register uint8_t *dest asm("2") = dst;
register uint64_t dest_len asm("3") = dst_len;
/* Issue CU41, then use ipm + srl 28 to move the condition code into
   operand %2 (cc). All four register variables are read-write ("+d")
   operands, so their values after the asm are what gets reported below.
   The "memory" clobber covers the bytes stored through dest. */
asm volatile(
CU41(2,4)
"ipm %2\n\t"
"srl %2,28\n\t"
: "+d"(dest), "+d"(source), "=d"(cc),
"+d"(source_len), "+d"(dest_len)
:
: "memory", "cc");
/* Capture register contents at end of cu41 */
regs.addr1 = (uint64_t)dest;
regs.len1 = dest_len;
regs.addr2 = (uint64_t)source;
regs.len2 = source_len;
regs.cc = cc;
return regs;
}
/* Run CU41 once on the given operands and print what happened.

   dst, dst_len: destination buffer and its length in bytes
   src, src_len: UTF-32 source buffer and its length in bytes

   Output, in order: the destination bytes that were produced (the count is
   dst_len minus the destination length remaining after the insn), the
   condition code, and for each operand how far its address advanced and
   how much length is left. The address difference is skipped for an
   operand whose pointer is NULL.

   The printed text is unchanged; the format specifiers now match the
   argument types, and the byte loop uses an unsigned 64-bit index so it
   is compared against the 64-bit count without a signed/unsigned mix. */
void
run_test(uint8_t *dst, uint64_t dst_len, uint32_t *src, uint64_t src_len)
{
   cu41_t result;
   uint64_t num_written;
   uint64_t i;

   result = do_cu41(dst, dst_len, src, src_len);

   /* Number of destination bytes consumed by the instruction. */
   num_written = dst_len - result.len1;

   // Write out the converted values, if any
   printf("UTF8: ");
   if (num_written == 0) {
      printf(" <none>");
   } else {
      for (i = 0; i < num_written; ++i) {
         printf(" %02x", dst[i]);
      }
   }
   printf("\n");

   printf(" cc = %" PRIu32 "\n", result.cc);

   /* Values are kept as signed 64-bit in the output (PRId64), so convert
      explicitly rather than passing a uint64_t to a signed conversion. */
   if (dst != NULL)
      printf(" dst address difference: %" PRId64,
             (int64_t)(result.addr1 - (uint64_t)dst));
   printf(" dst len: %" PRId64 "\n", (int64_t)result.len1);

   if (src != NULL)
      printf(" src address difference: %" PRId64,
             (int64_t)(result.addr2 - (uint64_t)src));
   printf(" src len: %" PRId64 "\n", (int64_t)result.len2);
}
/* Test driver: runs CU41 through run_test / write_and_check over the
   pattern buffers defined above and prints the results, grouped under
   "test N" banners. Always returns 0.

   Compared with the earlier form: main is declared with a (void) prototype,
   the loop index over `invalid` is a size_t (it is compared against a
   sizeof expression), and the element size is spelled sizeof invalid[0]
   instead of a literal 4. The sequence of calls and all output are the
   same. */
int main(void)
{
   size_t i;

   /* Length == 0, no memory should be read or written */
   printf("\n------------- test1 ----------------\n");
   run_test(NULL, 0, NULL, 0);

   /* Test exhaustion of source length (source bytes are valid) */
   printf("\n------------- test2.1 ----------------\n");

   /* No character will be written to BUFF, i.e. loop in jitted code
      is not iterated */
   run_test(buff, sizeof buff, NULL, 0);
   run_test(buff, sizeof buff, NULL, 1);
   run_test(buff, sizeof buff, NULL, 2);
   run_test(buff, sizeof buff, NULL, 3);
   run_test(buff, sizeof buff, pattern1, 0);
   run_test(buff, sizeof buff, pattern1, 1);
   run_test(buff, sizeof buff, pattern1, 2);
   run_test(buff, sizeof buff, pattern1, 3);

   printf("\n------------- test2.2 ----------------\n");
   /* At least one character will be written to BUFF, i.e. loop in jitted
      code is iterated */
   run_test(buff, sizeof buff, pattern1, 4);  /* 1 utf32 -> 1 1-byte utf8 */
   run_test(buff, sizeof buff, pattern2, 10); /* 2 utf32 -> 2 2-byte utf8 */
   run_test(buff, sizeof buff, pattern3, 5);  /* 1 utf32 -> 1 3-byte utf8 */
   run_test(buff, sizeof buff, pattern4, 21); /* 5 utf32 -> 5 4-byte utf8 */

   /* Test exhaustion of destination length (source bytes are valid) */
   printf("\n------------- test3.1 ----------------\n");

   /* No character will be written to BUFF, i.e. loop in jitted code
      is not iterated */

   /* Want to write at least 1 byte */
   run_test(NULL, 0, pattern1, sizeof pattern1);

   /* Want to write at least 2 bytes */
   run_test(NULL, 0, pattern2, sizeof pattern2);
   run_test(NULL, 1, pattern2, sizeof pattern2);

   /* Want to write at least 3 bytes */
   run_test(NULL, 0, pattern3, sizeof pattern3);
   run_test(NULL, 1, pattern3, sizeof pattern3);

   /* Want to write at least 4 bytes */
   run_test(NULL, 0, pattern4, sizeof pattern4);
   run_test(NULL, 1, pattern4, sizeof pattern4);
   run_test(NULL, 2, pattern4, sizeof pattern4);
   run_test(NULL, 3, pattern4, sizeof pattern4);

   /* When both operands are exhausted, cc=0 takes precedence.
      (test1 tests this for len == 0) */
   printf("\n------------- test4 ----------------\n");
   run_test(buff, 2, pattern1, 8);

   /* Input contains invalid characters */

   // As conversion stops upon encountering an invalid character, we
   // need to test each invalid character separately, to make sure it
   // is recognized as invalid.

   printf("\n------------- test5 ----------------\n");
   for (i = 0; i < sizeof invalid / sizeof invalid[0]; ++i) {
      /* Source length is exactly one UTF-32 character. */
      run_test(buff, sizeof buff, invalid + i, sizeof invalid[0]);
   }
   run_test(buff, 0, invalid, sizeof invalid); // cc = 2
   run_test(buff, 100, invalid, sizeof invalid);

   /* Convert all pattern buffers */
   printf("\n------------- test6 ----------------\n");
   run_test(buff, sizeof buff, pattern1, sizeof pattern1);
   run_test(buff, sizeof buff, pattern2, sizeof pattern2);
   run_test(buff, sizeof buff, pattern3, sizeof pattern3);
   run_test(buff, sizeof buff, pattern4, sizeof pattern4);
   run_test(buff, sizeof buff, mixed, sizeof mixed);

   /* Make sure we only write the exact number of bytes (and not more) */

   /* Write 1 byte */
   printf("\n------------- test7.0 ----------------\n");
   write_and_check(pattern1 + 2, 4, 1);

   /* Write 2 bytes */
   printf("\n------------- test7.1 ----------------\n");
   write_and_check(pattern2 + 3, 4, 2);

   /* Write 3 bytes */
   printf("\n------------- test7.2 ----------------\n");
   write_and_check(pattern3 + 6, 4, 3);

   /* Write 4 bytes */
   printf("\n------------- test7.3 ----------------\n");
   write_and_check(pattern4 + 5, 4, 4);

   return 0;
}
/* Convert INPUT with CU41 into the global buff and verify that nothing
   beyond the expected output was touched.

   input                      UTF-32 source characters
   num_input_bytes            source length in bytes
   num_expected_output_bytes  number of leading bytes of buff the
                              conversion is allowed to modify
   fill_byte                  value buff is pre-filled with; only its low
                              8 bits are used, as with memset

   buff is filled with the fill value, run_test performs (and prints) the
   conversion, and every byte from num_expected_output_bytes to the end of
   buff is then compared against the fill value. If any differ, a single
   diagnostic is written to stderr.

   The comparison uses the same truncated byte that memset stores, so a
   fill_byte above 0xFF no longer produces spurious mismatches; the index
   is a size_t and the message uses %u to match its unsigned argument. */
void
write_and_check_aux(uint32_t *input, unsigned num_input_bytes,
                    unsigned num_expected_output_bytes,
                    unsigned fill_byte)
{
   const unsigned char fill = (unsigned char)fill_byte;
   unsigned num_errors = 0;
   size_t i;

   /* Fill output buffer with FILL_BYTE */
   memset(buff, fill, sizeof buff);

   /* Execute cu41 */
   run_test(buff, sizeof buff, input, num_input_bytes);

   /* Make sure the rest of the buffer is unmodified. */
   for (i = num_expected_output_bytes; i < sizeof buff; ++i) {
      if (buff[i] != fill)
         ++num_errors;
   }

   if (num_errors)
      fprintf(stderr, "*** wrote more than %u bytes\n",
              num_expected_output_bytes);
}
/* Run write_and_check_aux twice on the same input, once per fill pattern.
   The second pass, with a 0xFF fill, is there to make sure we did not
   write an extra 0x0 byte, which the first pass (0x0 fill) cannot see. */
void
write_and_check(uint32_t *input, unsigned num_input_bytes,
                unsigned num_expected_output_bytes)
{
   static const unsigned fill_patterns[] = { 0x0, 0xFF };
   unsigned pass;

   for (pass = 0; pass < sizeof fill_patterns / sizeof fill_patterns[0]; ++pass) {
      write_and_check_aux(input, num_input_bytes, num_expected_output_bytes,
                          fill_patterns[pass]);
   }
}