#include "test.h" #define M64 67108864 #define aB1 (1<<1) #define aB2 (1<<2) #define aB3 (1<<3) #define aB4 (1<<4) #define aB5 (1<<5) #define aB6 (1<<6) #define aB7 (1<<7) #define aB8 (1<<8) #define aB9 (1<<9) #define aB10 (1<<10) #define aB11 (1<<11) #define aB12 (1<<12) #define aB13 (1<<13) #define aB14 (1<<14) #define aB15 (1<<15) #define aB16 (1<<16) #define aB17 (1<<17) #define aB18 (1<<18) #define aB19 (1<<19) #define aB20 (1<<20) #define aB21 (1<<21) #define aB22 (1<<22) #define aB23 (1<<23) #define aB24 (1<<24) #define aB25 (1<<25) #define aB26 (1<<26) #define bB1 (-aB1) #define bB2 (-aB2) #define bB3 (-aB3) #define bB4 (-aB4) #define bB5 (-aB5) #define bB6 (-aB6) #define bB7 (-aB7) #define bB8 (-aB8) #define bB9 (-aB9) #define bB10 (-aB10) #define bB11 (-aB11) #define bB12 (-aB12) #define bB13 (-aB13) #define bB14 (-aB14) #define bB15 (-aB15) #define bB16 (-aB16) #define bB17 (-aB17) #define bB18 (-aB18) #define bB19 (-aB19) #define bB20 (-aB20) #define bB21 (-aB21) #define bB22 (-aB22) #define bB23 (-aB23) #define bB24 (-aB24) #define bB25 (-aB25) #define bB26 (-aB26) #define cB1 (aB1-1) #define cB2 (aB2-1) #define cB3 (aB3-1) #define cB4 (aB4-1) #define cB5 (aB5-1) #define cB6 (aB6-1) #define cB7 (aB7-1) #define cB8 (aB8-1) #define cB9 (aB9-1) #define cB10 (aB10-1) #define cB11 (aB11-1) #define cB12 (aB12-1) #define cB13 (aB13-1) #define cB14 (aB14-1) #define cB15 (aB15-1) #define cB16 (aB16-1) #define cB17 (aB17-1) #define cB18 (aB18-1) #define cB19 (aB19-1) #define cB20 (aB20-1) #define cB21 (aB21-1) #define cB22 (aB22-1) #define cB23 (aB23-1) #define cB24 (aB24-1) #define cB25 (aB25-1) #define cB26 (aB26-1) #define dB1 (-aB1+1) #define dB2 (-aB2+1) #define dB3 (-aB3+1) #define dB4 (-aB4+1) #define dB5 (-aB5+1) #define dB6 (-aB6+1) #define dB7 (-aB7+1) #define dB8 (-aB8+1) #define dB9 (-aB9+1) #define dB10 (-aB10+1) #define dB11 (-aB11+1) #define dB12 (-aB12+1) #define dB13 (-aB13+1) #define dB14 (-aB14+1) #define dB15 (-aB15+1) #define dB16 (-aB16+1) #define dB17 (-aB17+1) #define dB18 (-aB18+1) #define dB19 (-aB19+1) #define dB20 (-aB20+1) #define dB21 (-aB21+1) #define dB22 (-aB22+1) #define dB23 (-aB23+1) #define dB24 (-aB24+1) #define dB25 (-aB25+1) #define dB26 (-aB26+1) #define add(a, b) (a + b) #define sub(a, b) (a - b) #define mul(a, b) (a * b) #define div(a, b) (a / b) #define rem(a, b) (a % b) #define and(a, b) (a & b) #define or(a, b) (a | b) #define xor(a, b) (a ^ b) #if defined(DEBUG) #define dump_args(N, X, L, R, V)\ jit_calli_1(_jit, puts,\ jit_operand_imm(JIT_OPERAND_ABI_POINTER,\ (jit_imm_t)#N " " #X " " #L " " #R " " #V)) #else #define dump_args(N, X, L, R, V) #endif #define jit_rshi_ui jit_rshi_u #define alu2(N, X, L, R, V) \ { \ dump_args(N, X, L, R, V); \ jit_movi(_jit, JIT_R1, L); \ jit_movi(_jit, JIT_R2, R); \ jit_##N##r(_jit, JIT_R0, JIT_R1, JIT_R2); \ jit_reloc_t r = jit_beqi(_jit, JIT_R0, V); \ jit_calli_0(_jit, abort); \ jit_patch_here(_jit, r); \ } #define alu1(N, M) \ alu2(N, N##M##1, 3, (M##1), N(3, M##1)) \ alu2(N, N##M##2, 3, (M##2), N(3, M##2)) \ alu2(N, N##M##3, 3, (M##3), N(3, M##3)) \ alu2(N, N##M##4, 3, (M##4), N(3, M##4)) \ alu2(N, N##M##5, 3, (M##5), N(3, M##5)) \ alu2(N, N##M##6, 3, (M##6), N(3, M##6)) \ alu2(N, N##M##7, 3, (M##7), N(3, M##7)) \ alu2(N, N##M##8, 3, (M##8), N(3, M##8)) \ alu2(N, N##M##9, 3, (M##9), N(3, M##9)) \ alu2(N, N##M##10, 3, (M##10), N(3, M##10)) \ alu2(N, N##M##11, 3, (M##11), N(3, M##11)) \ alu2(N, N##M##12, 3, (M##12), N(3, M##12)) \ alu2(N, N##M##13, 3, (M##13), N(3, M##13)) \ alu2(N, N##M##14, 3, (M##14), N(3, M##14)) \ alu2(N, N##M##15, 3, (M##15), N(3, M##15)) \ alu2(N, N##M##16, 3, (M##16), N(3, M##16)) \ alu2(N, N##M##17, 3, (M##17), N(3, M##17)) \ alu2(N, N##M##18, 3, (M##18), N(3, M##18)) \ alu2(N, N##M##19, 3, (M##19), N(3, M##19)) \ alu2(N, N##M##20, 3, (M##20), N(3, M##20)) \ alu2(N, N##M##21, 3, (M##21), N(3, M##21)) \ alu2(N, N##M##22, 3, (M##22), N(3, M##22)) \ alu2(N, N##M##23, 3, (M##23), N(3, M##23)) \ alu2(N, N##M##24, 3, (M##24), N(3, M##24)) \ alu2(N, N##M##25, 3, (M##25), N(3, M##25)) \ alu2(N, N##M##26, 3, (M##26), N(3, M##26)) #define alu(N) \ alu1(N, aB) \ alu1(N, bB) \ alu1(N, cB) \ alu1(N, dB) #define _lsh(N) \ alu2(lsh, L##N, 1, N, (1L<>N)) #define _rush(N) \ alu2(rsh_u, R##N, (1UL<<63), N, ((1UL<<63)>>N)) #else #define _rsh(N) \ alu2(rsh, R##N, (1L<<31), N, ((1L<<31)>>N)) #define _rush(N) \ alu2(rsh_u, R##N, (1UL<<31), N, ((1UL<<31)>>N)) #endif #if __WORDSIZE == 32 # define xsh64(X) /**/ #else # define xsh64(X) \ _##X##sh(32) \ _##X##sh(33) \ _##X##sh(34) \ _##X##sh(35) \ _##X##sh(36) \ _##X##sh(37) \ _##X##sh(38) \ _##X##sh(39) \ _##X##sh(40) \ _##X##sh(41) \ _##X##sh(42) \ _##X##sh(43) \ _##X##sh(44) \ _##X##sh(45) \ _##X##sh(46) \ _##X##sh(47) \ _##X##sh(48) \ _##X##sh(49) \ _##X##sh(50) \ _##X##sh(51) \ _##X##sh(52) \ _##X##sh(53) \ _##X##sh(54) \ _##X##sh(55) \ _##X##sh(56) \ _##X##sh(57) \ _##X##sh(58) \ _##X##sh(59) \ _##X##sh(60) \ _##X##sh(61) \ _##X##sh(62) \ _##X##sh(63) #endif #define xsh(X) \ _##X##sh(0) \ _##X##sh(1) \ _##X##sh(2) \ _##X##sh(3) \ _##X##sh(4) \ _##X##sh(5) \ _##X##sh(6) \ _##X##sh(7) \ _##X##sh(8) \ _##X##sh(9) \ _##X##sh(10) \ _##X##sh(11) \ _##X##sh(12) \ _##X##sh(13) \ _##X##sh(14) \ _##X##sh(15) \ _##X##sh(16) \ _##X##sh(17) \ _##X##sh(18) \ _##X##sh(19) \ _##X##sh(20) \ _##X##sh(21) \ _##X##sh(22) \ _##X##sh(23) \ _##X##sh(24) \ _##X##sh(25) \ _##X##sh(26) \ _##X##sh(27) \ _##X##sh(28) \ _##X##sh(29) \ _##X##sh(30) \ _##X##sh(31) \ xsh64(X) #define lsh() \ xsh(l) #define rsh() \ xsh(r) #define rsh_u() \ xsh(ru) #define reset(V) \ jit_calli_3(_jit, memset, \ jit_operand_imm(JIT_OPERAND_ABI_POINTER, (jit_imm_t)buf),\ jit_operand_imm(JIT_OPERAND_ABI_INT32, V), \ jit_operand_imm(JIT_OPERAND_ABI_UINT32, M64 + 8)); #define stx(T, N, O, V) \ jit_movi(_jit, JIT_R0, V); \ jit_movi(_jit, JIT_R1, O); \ jit_stxr##T(_jit, JIT_R1, JIT_V0, JIT_R0); #define stx8(T, M, V) \ stx(T, 3, (M##B3), V) \ stx(T, 4, (M##B4), V) \ stx(T, 5, (M##B5), V) \ stx(T, 6, (M##B6), V) \ stx(T, 7, (M##B7), V) \ stx(T, 8, (M##B8), V) \ stx(T, 9, (M##B9), V) \ stx(T, 10, (M##B10), V) \ stx(T, 11, (M##B11), V) \ stx(T, 12, (M##B12), V) \ stx(T, 13, (M##B13), V) \ stx(T, 14, (M##B14), V) \ stx(T, 15, (M##B15), V) \ stx(T, 16, (M##B16), V) \ stx(T, 17, (M##B17), V) \ stx(T, 18, (M##B18), V) \ stx(T, 19, (M##B19), V) \ stx(T, 20, (M##B20), V) \ stx(T, 21, (M##B21), V) \ stx(T, 22, (M##B22), V) \ stx(T, 23, (M##B23), V) \ stx(T, 24, (M##B24), V) \ stx(T, 25, (M##B25), V) \ stx(T, 26, (M##B26), V) #define stx4(T, M, V) \ stx(T, 2, (M##B2), V) \ stx8(T, M, V) #define stx2(T, M, V) \ stx(T, 1, (M##B1), V) \ stx4(T, M, V) #define ldx(T, N, M, O, V) \ { \ dump_args(T, N, M, O, V); \ jit_movi(_jit, JIT_R0, 0); \ jit_ldxi##T(_jit, JIT_R0, JIT_V0, O); \ jit_reloc_t r = jit_beqi(_jit, JIT_R0, V); \ jit_calli_0(_jit, abort); \ jit_patch_here(_jit, r); \ } #define ldx8(T, M, V) \ ldx(T, 3, M, (M##B3), V) \ ldx(T, 4, M, (M##B4), V) \ ldx(T, 5, M, (M##B5), V) \ ldx(T, 6, M, (M##B6), V) \ ldx(T, 7, M, (M##B7), V) \ ldx(T, 8, M, (M##B8), V) \ ldx(T, 9, M, (M##B9), V) \ ldx(T, 10, M, (M##B10), V) \ ldx(T, 11, M, (M##B11), V) \ ldx(T, 12, M, (M##B12), V) \ ldx(T, 13, M, (M##B13), V) \ ldx(T, 14, M, (M##B14), V) \ ldx(T, 15, M, (M##B15), V) \ ldx(T, 16, M, (M##B16), V) \ ldx(T, 17, M, (M##B17), V) \ ldx(T, 18, M, (M##B18), V) \ ldx(T, 19, M, (M##B19), V) \ ldx(T, 20, M, (M##B20), V) \ ldx(T, 21, M, (M##B21), V) \ ldx(T, 22, M, (M##B22), V) \ ldx(T, 23, M, (M##B23), V) \ ldx(T, 24, M, (M##B24), V) \ ldx(T, 25, M, (M##B25), V) \ ldx(T, 26, M, (M##B26), V) #define ldx4(T, M, V) \ ldx(T, 2, M, (M##B2), V) \ ldx8(T, M, V) #define ldx2(T, M, V) \ ldx(T, 1, M, (M##B1), V) \ ldx4(T, M, V) #define stf(T, N, O, V) \ jit_movi##T(_jit, JIT_F0, V); \ jit_movi(_jit, JIT_R0, O); \ jit_stxr##T(_jit, JIT_R0, JIT_V0, JIT_F0); #define stf8(T, M, V) \ stf(T, 3, (M##B3), V) \ stf(T, 4, (M##B4), V) \ stf(T, 5, (M##B5), V) \ stf(T, 6, (M##B6), V) \ stf(T, 7, (M##B7), V) \ stf(T, 8, (M##B8), V) \ stf(T, 9, (M##B9), V) \ stf(T, 10, (M##B10), V) \ stf(T, 11, (M##B11), V) \ stf(T, 12, (M##B12), V) \ stf(T, 13, (M##B13), V) \ stf(T, 14, (M##B14), V) \ stf(T, 15, (M##B15), V) \ stf(T, 16, (M##B16), V) \ stf(T, 17, (M##B17), V) \ stf(T, 18, (M##B18), V) \ stf(T, 19, (M##B19), V) \ stf(T, 20, (M##B20), V) \ stf(T, 21, (M##B21), V) \ stf(T, 22, (M##B22), V) \ stf(T, 23, (M##B23), V) \ stf(T, 24, (M##B24), V) \ stf(T, 25, (M##B25), V) \ stf(T, 26, (M##B26), V) #define stf4(T, M, V) \ stf(T, 2, (M##B2), V) \ stf8(T, M, V) #define ldf(T, N, M, O, V) \ { \ dump_args(T, N, M, O, V); \ jit_movi##T(_jit, JIT_F0, 0); \ jit_ldxi##T(_jit, JIT_F0, JIT_V0, O); \ jit_movi##T(_jit, JIT_F1, V); \ jit_reloc_t r = jit_beqr##T(_jit, JIT_F0, JIT_F1); \ jit_calli_0(_jit, abort); \ jit_patch_here(_jit, r); \ } #define ldf8(T, M, V) \ ldf(T, 3, M, (M##B3), V) \ ldf(T, 4, M, (M##B4), V) \ ldf(T, 5, M, (M##B5), V) \ ldf(T, 6, M, (M##B6), V) \ ldf(T, 7, M, (M##B7), V) \ ldf(T, 8, M, (M##B8), V) \ ldf(T, 9, M, (M##B9), V) \ ldf(T, 10, M, (M##B10), V) \ ldf(T, 11, M, (M##B11), V) \ ldf(T, 12, M, (M##B12), V) \ ldf(T, 13, M, (M##B13), V) \ ldf(T, 14, M, (M##B14), V) \ ldf(T, 15, M, (M##B15), V) \ ldf(T, 16, M, (M##B16), V) \ ldf(T, 17, M, (M##B17), V) \ ldf(T, 18, M, (M##B18), V) \ ldf(T, 19, M, (M##B19), V) \ ldf(T, 20, M, (M##B20), V) \ ldf(T, 21, M, (M##B21), V) \ ldf(T, 22, M, (M##B22), V) \ ldf(T, 23, M, (M##B23), V) \ ldf(T, 24, M, (M##B24), V) \ ldf(T, 25, M, (M##B25), V) \ ldf(T, 26, M, (M##B26), V) #define ldf4(T, M, V) \ ldf(T, 2, M, (M##B2), V) \ ldf8(T, M, V) #define ldst_c() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx2(_c, a, 0x5a) \ ldx2(_c, a, 0x5a) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx2(_c, b, 0x5a) \ ldx2(_c, b, 0x5a) #define ldst_uc() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx2(_c, a, 0x5a) \ ldx2(_uc, a, 0x5a) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx2(_c, b, 0x5a) \ ldx2(_uc, b, 0x5a) #define ldst_s() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx2(_s, a, 0x5a5a) \ ldx2(_s, a, 0x5a5a) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx2(_s, b, 0x5a5a) \ ldx2(_s, b, 0x5a5a) #define ldst_us() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx2(_s, a, 0x5a5a) \ ldx2(_us, a, 0x5a5a) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx2(_s, b, 0x5a5a) \ ldx2(_us, b, 0x5a5a) #define ldst_i() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx4(_i, a, 0x5a5a5a5a) \ ldx4(_i, a, 0x5a5a5a5a) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx4(_i, b, 0x5a5a5a5a) \ ldx4(_i, b, 0x5a5a5a5a) #define ldst_ui() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx4(_i, a, 0x5a5a5a5a) \ ldx4(_ui, a, 0x5a5a5a5a) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx4(_i, b, 0x5a5a5a5a) \ ldx4(_ui, b, 0x5a5a5a5a) #define ldst_l() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stx8(_l, a, 0x5a5a5a5a5a5a5a5a) \ ldx8(_l, a, 0x5a5a5a5a5a5a5a5a) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stx8(_l, b, 0x5a5a5a5a5a5a5a5a) \ ldx8(_l, b, 0x5a5a5a5a5a5a5a5a) #define ldst_f() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stf4(_f, a, 0.5) \ ldf4(_f, a, 0.5) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stf4(_f, b, 0.5) \ ldf4(_f, b, 0.5) #define ldst_d() \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ stf8(_d, a, 0.5) \ ldf8(_d, a, 0.5) \ reset(0xa5) \ jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ stf8(_d, b, 0.5) \ ldf8(_d, b, 0.5) static size_t run_test(jit_state_t *_jit, uint8_t *arena_base, size_t arena_size) { jit_begin(_jit, arena_base, arena_size); size_t frame = jit_enter_jit_abi(_jit, 3, 0, 0); void (*function)(void); char *buf = malloc(M64 + 8); ASSERT(buf); alu(add) alu(sub) alu(mul) alu(div) alu(rem) lsh() rsh() alu(and) alu(or) alu(xor) ldst_c() ldst_uc() ldst_s() ldst_us() ldst_i() #if __WORDSIZE == 64 ldst_ui() ldst_l() #endif ldst_f() ldst_d() jit_leave_jit_abi(_jit, 3, 0, frame); jit_ret(_jit); size_t size = 0; function = jit_end(_jit, &size); if (function) (*function)(); else { free(buf); return size; } free(buf); return 0; } int main(int argc, char *argv[]) { return main_compiler(argc, argv, run_test); }