#include <stdint.h> #include <inttypes.h> #include <stdlib.h> #include <string.h> #include <stdio.h> #include <assert.h> #include "opcodes.h" /* The abstracted result of an CU42 insn */ typedef struct { uint64_t addr1; // target uint64_t len1; uint64_t addr2; // source uint64_t len2; uint32_t cc; } cu42_t; /* Define various input buffers. */ /* U+0000 to U+d7ff: Result is 2 bytes for each uint32_t U+dc00 to U+ffff: Result is 2 bytes for each uint32_t */ uint32_t pattern2[] = { 0x0000, 0xd7ff, /* corner cases */ 0xdc00, 0xffff, /* corner cases */ 0xabba, 0xf00d, 0xd00f, 0x1234 /* misc */ }; /* U+00010000 to U+0010ffff: Result is 4 bytes for each uint32_t */ uint32_t pattern4[] = { 0x00010000, 0x0010ffff, /* corner cases */ 0x00010123, 0x00023456, 0x000789ab, 0x00100000 /* misc */ }; /* Invalid UTF-32 character */ uint32_t invalid[] = { 0x0000d800, 0x0000dbff, /* corner cases */ 0x00110000, 0xffffffff, /* corner cases */ 0x0000daad, 0x0000d901, 0x0000d8ff, /* misc */ 0x00110011, 0x01000000, 0x10000000, 0xdeadbeef /* misc */ }; /* Mixed bytes */ uint32_t mixed[] = { 0x00000078 /* 2 bytes */, 0x0000d000 /* 2 bytes */, 0x00033333 /* 4 bytes */, 0x00040404 /* 4 bytes */, 0x0000abcd /* 2 bytes */, }; /* This is the buffer for the converted bytes. */ uint16_t buff[1000]; /* Large so we con'don't have to worry about it */ void write_and_check(uint32_t *, unsigned, unsigned); static cu42_t do_cu42(uint16_t *dst, uint64_t dst_len, uint32_t *src, uint64_t src_len) { int cc = 42; cu42_t regs; /* build up the register pairs */ register uint32_t *source asm("4") = src; register uint64_t source_len asm("5") = src_len; register uint16_t *dest asm("2") = dst; register uint64_t dest_len asm("3") = dst_len; asm volatile( CU42(2,4) "ipm %2\n\t" "srl %2,28\n\t" : "+d"(dest), "+d"(source), "=d"(cc), "+d"(source_len), "+d"(dest_len) : : "memory", "cc"); /* Capture register contents at end of cu42 */ regs.addr1 = (uint64_t)dest; regs.len1 = dest_len; regs.addr2 = (uint64_t)source; regs.len2 = source_len; regs.cc = cc; return regs; } void run_test(uint16_t *dst, uint64_t dst_len, uint32_t *src, uint64_t src_len) { int i; cu42_t result; result = do_cu42(dst, dst_len, src, src_len); // Write out the converted values, if any printf("UTF16: "); if (dst_len - result.len1 == 0) printf(" <none>"); else assert((dst_len - result.len1) % 2 == 0); for (i = 0; i < (dst_len - result.len1) / 2; ++i) { printf(" %04x", dst[i]); } printf("\n"); printf(" cc = %d\n", result.cc); if (dst != NULL) printf(" dst address difference: %"PRId64, result.addr1 - (uint64_t)dst); printf(" dst len: %"PRId64"\n", result.len1); if (src != NULL) printf(" src address difference: %"PRId64, result.addr2 - (uint64_t)src); printf(" src len: %"PRId64"\n", result.len2); } int main() { int i; /* Length == 0, no memory should be read or written */ printf("\n------------- test1 ----------------\n"); run_test(NULL, 0, NULL, 0); /* Test exhaustion of source length (source bytes are valid) */ printf("\n------------- test2.1 ----------------\n"); /* No character will be written to BUFF, i.e. loop in jitted code is not iterated */ run_test(buff, sizeof buff, NULL, 0); run_test(buff, sizeof buff, NULL, 1); run_test(buff, sizeof buff, NULL, 2); run_test(buff, sizeof buff, NULL, 3); run_test(buff, sizeof buff, pattern2, 0); run_test(buff, sizeof buff, pattern2, 1); run_test(buff, sizeof buff, pattern2, 2); run_test(buff, sizeof buff, pattern2, 3); printf("\n------------- test2.2 ----------------\n"); /* At least one character will be written to BUFF, i.e. loop in jitted code is iterated */ run_test(buff, sizeof buff, pattern2, 4); /* 1 utf32 -> 1 utf16 */ run_test(buff, sizeof buff, pattern2, 10); /* 2 utf32 -> 2 utf16 */ run_test(buff, sizeof buff, pattern4, 5); /* 1 utf32 -> 2 utf16 */ run_test(buff, sizeof buff, pattern4, 11); /* 2 utf32 -> 4 utf16 */ run_test(buff, sizeof buff, pattern4, 18); /* 4 utf32 -> 8 utf16 */ /* Test exhaustion of destination length (source bytes are valid) */ printf("\n------------- test3.1 ----------------\n"); /* No character will be written to BUFF, i.e. loop in jitted code is not iterated */ /* Want to write at least 1 UTF-16 */ run_test(NULL, 0, pattern2, sizeof pattern2); /* Want to write at least 1 UTF-16 */ run_test(NULL, 0, pattern2, sizeof pattern2); run_test(NULL, 1, pattern2, sizeof pattern2); /* Want to write at least 2 UTF-16 */ run_test(NULL, 0, pattern4, sizeof pattern4); run_test(NULL, 1, pattern4, sizeof pattern4); run_test(NULL, 2, pattern4, sizeof pattern4); run_test(NULL, 3, pattern4, sizeof pattern4); /* When both operands are exhausted, cc=0 takes precedence. (test1 tests this for len == 0) */ printf("\n------------- test4 ----------------\n"); run_test(buff, 4, pattern2, 8); /* Input contains invalid characters */ // As conversion stops upon encountering an invalid character, we // need to test each invalid character separately, to make sure it // is recognized as invalid. printf("\n------------- test5 ----------------\n"); for (i = 0; i < sizeof invalid / 4; ++i) { run_test(buff, sizeof buff, invalid + i, 4); } run_test(buff, 0, invalid, sizeof invalid); // cc = 2 run_test(buff, 100, invalid, sizeof invalid); /* Convert all pattern buffers */ printf("\n------------- test6 ----------------\n"); run_test(buff, sizeof buff, pattern2, sizeof pattern2); run_test(buff, sizeof buff, pattern4, sizeof pattern4); run_test(buff, sizeof buff, mixed, sizeof mixed); /* Make sure we only write the exact number of bytes (and not more) */ /* Write 2 bytes */ printf("\n------------- test7.1 ----------------\n"); write_and_check(pattern2 + 3, 4, 2); /* Write 4 bytes */ printf("\n------------- test7.2 ----------------\n"); write_and_check(pattern4 + 5, 4, 4); return 0; } void write_and_check_aux(uint32_t *input, unsigned num_input_bytes, unsigned num_expected_output_bytes, unsigned fill_byte) { int num_errors, i; /* Fill output buffer with FILL_BYTE */ memset(buff, fill_byte, sizeof buff); /* Execute cu42 */ run_test(buff, sizeof buff, input, num_input_bytes); /* Make sure the rest of the buffer is unmodified. */ num_errors = 0; for (i = num_expected_output_bytes; i < sizeof buff; ++i) if (((unsigned char *)buff)[i] != fill_byte) ++num_errors; if (num_errors) fprintf(stderr, "*** wrote more than %d bytes\n", num_expected_output_bytes); } void write_and_check(uint32_t *input, unsigned num_input_bytes, unsigned num_expected_output_bytes) { write_and_check_aux(input, num_input_bytes, num_expected_output_bytes, 0x0); /* Run again with different fill pattern to make sure we did not write an extra 0x0 byte */ write_and_check_aux(input, num_input_bytes, num_expected_output_bytes, 0xFF); }