diff options
Diffstat (limited to 'deps/lightening/tests/z_ranger.c')
-rw-r--r-- | deps/lightening/tests/z_ranger.c | 580 |
1 files changed, 580 insertions, 0 deletions
diff --git a/deps/lightening/tests/z_ranger.c b/deps/lightening/tests/z_ranger.c new file mode 100644 index 0000000..aa9eadd --- /dev/null +++ b/deps/lightening/tests/z_ranger.c @@ -0,0 +1,580 @@ +#include "test.h" + +#define M64 67108864 + +#define aB1 (1<<1) +#define aB2 (1<<2) +#define aB3 (1<<3) +#define aB4 (1<<4) +#define aB5 (1<<5) +#define aB6 (1<<6) +#define aB7 (1<<7) +#define aB8 (1<<8) +#define aB9 (1<<9) +#define aB10 (1<<10) +#define aB11 (1<<11) +#define aB12 (1<<12) +#define aB13 (1<<13) +#define aB14 (1<<14) +#define aB15 (1<<15) +#define aB16 (1<<16) +#define aB17 (1<<17) +#define aB18 (1<<18) +#define aB19 (1<<19) +#define aB20 (1<<20) +#define aB21 (1<<21) +#define aB22 (1<<22) +#define aB23 (1<<23) +#define aB24 (1<<24) +#define aB25 (1<<25) +#define aB26 (1<<26) +#define bB1 (-aB1) +#define bB2 (-aB2) +#define bB3 (-aB3) +#define bB4 (-aB4) +#define bB5 (-aB5) +#define bB6 (-aB6) +#define bB7 (-aB7) +#define bB8 (-aB8) +#define bB9 (-aB9) +#define bB10 (-aB10) +#define bB11 (-aB11) +#define bB12 (-aB12) +#define bB13 (-aB13) +#define bB14 (-aB14) +#define bB15 (-aB15) +#define bB16 (-aB16) +#define bB17 (-aB17) +#define bB18 (-aB18) +#define bB19 (-aB19) +#define bB20 (-aB20) +#define bB21 (-aB21) +#define bB22 (-aB22) +#define bB23 (-aB23) +#define bB24 (-aB24) +#define bB25 (-aB25) +#define bB26 (-aB26) +#define cB1 (aB1-1) +#define cB2 (aB2-1) +#define cB3 (aB3-1) +#define cB4 (aB4-1) +#define cB5 (aB5-1) +#define cB6 (aB6-1) +#define cB7 (aB7-1) +#define cB8 (aB8-1) +#define cB9 (aB9-1) +#define cB10 (aB10-1) +#define cB11 (aB11-1) +#define cB12 (aB12-1) +#define cB13 (aB13-1) +#define cB14 (aB14-1) +#define cB15 (aB15-1) +#define cB16 (aB16-1) +#define cB17 (aB17-1) +#define cB18 (aB18-1) +#define cB19 (aB19-1) +#define cB20 (aB20-1) +#define cB21 (aB21-1) +#define cB22 (aB22-1) +#define cB23 (aB23-1) +#define cB24 (aB24-1) +#define cB25 (aB25-1) +#define cB26 (aB26-1) +#define dB1 (-aB1+1) +#define dB2 (-aB2+1) +#define dB3 (-aB3+1) +#define dB4 (-aB4+1) +#define dB5 (-aB5+1) +#define dB6 (-aB6+1) +#define dB7 (-aB7+1) +#define dB8 (-aB8+1) +#define dB9 (-aB9+1) +#define dB10 (-aB10+1) +#define dB11 (-aB11+1) +#define dB12 (-aB12+1) +#define dB13 (-aB13+1) +#define dB14 (-aB14+1) +#define dB15 (-aB15+1) +#define dB16 (-aB16+1) +#define dB17 (-aB17+1) +#define dB18 (-aB18+1) +#define dB19 (-aB19+1) +#define dB20 (-aB20+1) +#define dB21 (-aB21+1) +#define dB22 (-aB22+1) +#define dB23 (-aB23+1) +#define dB24 (-aB24+1) +#define dB25 (-aB25+1) +#define dB26 (-aB26+1) + +#define add(a, b) (a + b) +#define sub(a, b) (a - b) +#define mul(a, b) (a * b) +#define div(a, b) (a / b) +#define rem(a, b) (a % b) +#define and(a, b) (a & b) +#define or(a, b) (a | b) +#define xor(a, b) (a ^ b) + +#if defined(DEBUG) +#define dump_args(N, X, L, R, V)\ + jit_calli_1(_jit, puts,\ + jit_operand_imm(JIT_OPERAND_ABI_POINTER,\ + (jit_imm_t)#N " " #X " " #L " " #R " " #V)) +#else +#define dump_args(N, X, L, R, V) +#endif + +#define jit_rshi_ui jit_rshi_u + +#define alu2(N, X, L, R, V) \ +{ \ + dump_args(N, X, L, R, V); \ + jit_movi(_jit, JIT_R1, L); \ + jit_movi(_jit, JIT_R2, R); \ + jit_##N##r(_jit, JIT_R0, JIT_R1, JIT_R2); \ + jit_reloc_t r = jit_beqi(_jit, JIT_R0, V); \ + jit_calli_0(_jit, abort); \ + jit_patch_here(_jit, r); \ +} + +#define alu1(N, M) \ + alu2(N, N##M##1, 3, (M##1), N(3, M##1)) \ + alu2(N, N##M##2, 3, (M##2), N(3, M##2)) \ + alu2(N, N##M##3, 3, (M##3), N(3, M##3)) \ + alu2(N, N##M##4, 3, (M##4), N(3, M##4)) \ + alu2(N, N##M##5, 3, (M##5), N(3, M##5)) \ + alu2(N, N##M##6, 3, (M##6), N(3, M##6)) \ + alu2(N, N##M##7, 3, (M##7), N(3, M##7)) \ + alu2(N, N##M##8, 3, (M##8), N(3, M##8)) \ + alu2(N, N##M##9, 3, (M##9), N(3, M##9)) \ + alu2(N, N##M##10, 3, (M##10), N(3, M##10)) \ + alu2(N, N##M##11, 3, (M##11), N(3, M##11)) \ + alu2(N, N##M##12, 3, (M##12), N(3, M##12)) \ + alu2(N, N##M##13, 3, (M##13), N(3, M##13)) \ + alu2(N, N##M##14, 3, (M##14), N(3, M##14)) \ + alu2(N, N##M##15, 3, (M##15), N(3, M##15)) \ + alu2(N, N##M##16, 3, (M##16), N(3, M##16)) \ + alu2(N, N##M##17, 3, (M##17), N(3, M##17)) \ + alu2(N, N##M##18, 3, (M##18), N(3, M##18)) \ + alu2(N, N##M##19, 3, (M##19), N(3, M##19)) \ + alu2(N, N##M##20, 3, (M##20), N(3, M##20)) \ + alu2(N, N##M##21, 3, (M##21), N(3, M##21)) \ + alu2(N, N##M##22, 3, (M##22), N(3, M##22)) \ + alu2(N, N##M##23, 3, (M##23), N(3, M##23)) \ + alu2(N, N##M##24, 3, (M##24), N(3, M##24)) \ + alu2(N, N##M##25, 3, (M##25), N(3, M##25)) \ + alu2(N, N##M##26, 3, (M##26), N(3, M##26)) + +#define alu(N) \ + alu1(N, aB) \ + alu1(N, bB) \ + alu1(N, cB) \ + alu1(N, dB) + +#define _lsh(N) \ + alu2(lsh, L##N, 1, N, (1L<<N)) + +#if __WORDSIZE == 64 +#define _rsh(N) \ + alu2(rsh, R##N, (1L<<63), N, ((1L<<63)>>N)) + +#define _rush(N) \ + alu2(rsh_u, R##N, (1UL<<63), N, ((1UL<<63)>>N)) +#else +#define _rsh(N) \ + alu2(rsh, R##N, (1L<<31), N, ((1L<<31)>>N)) + +#define _rush(N) \ + alu2(rsh_u, R##N, (1UL<<31), N, ((1UL<<31)>>N)) +#endif + +#if __WORDSIZE == 32 +# define xsh64(X) /**/ +#else +# define xsh64(X) \ + _##X##sh(32) \ + _##X##sh(33) \ + _##X##sh(34) \ + _##X##sh(35) \ + _##X##sh(36) \ + _##X##sh(37) \ + _##X##sh(38) \ + _##X##sh(39) \ + _##X##sh(40) \ + _##X##sh(41) \ + _##X##sh(42) \ + _##X##sh(43) \ + _##X##sh(44) \ + _##X##sh(45) \ + _##X##sh(46) \ + _##X##sh(47) \ + _##X##sh(48) \ + _##X##sh(49) \ + _##X##sh(50) \ + _##X##sh(51) \ + _##X##sh(52) \ + _##X##sh(53) \ + _##X##sh(54) \ + _##X##sh(55) \ + _##X##sh(56) \ + _##X##sh(57) \ + _##X##sh(58) \ + _##X##sh(59) \ + _##X##sh(60) \ + _##X##sh(61) \ + _##X##sh(62) \ + _##X##sh(63) +#endif + +#define xsh(X) \ + _##X##sh(0) \ + _##X##sh(1) \ + _##X##sh(2) \ + _##X##sh(3) \ + _##X##sh(4) \ + _##X##sh(5) \ + _##X##sh(6) \ + _##X##sh(7) \ + _##X##sh(8) \ + _##X##sh(9) \ + _##X##sh(10) \ + _##X##sh(11) \ + _##X##sh(12) \ + _##X##sh(13) \ + _##X##sh(14) \ + _##X##sh(15) \ + _##X##sh(16) \ + _##X##sh(17) \ + _##X##sh(18) \ + _##X##sh(19) \ + _##X##sh(20) \ + _##X##sh(21) \ + _##X##sh(22) \ + _##X##sh(23) \ + _##X##sh(24) \ + _##X##sh(25) \ + _##X##sh(26) \ + _##X##sh(27) \ + _##X##sh(28) \ + _##X##sh(29) \ + _##X##sh(30) \ + _##X##sh(31) \ + xsh64(X) + +#define lsh() \ + xsh(l) + +#define rsh() \ + xsh(r) + +#define rsh_u() \ + xsh(ru) + +#define reset(V) \ + jit_calli_3(_jit, memset, \ + jit_operand_imm(JIT_OPERAND_ABI_POINTER, (jit_imm_t)buf),\ + jit_operand_imm(JIT_OPERAND_ABI_INT32, V), \ + jit_operand_imm(JIT_OPERAND_ABI_UINT32, M64 + 8)); + +#define stx(T, N, O, V) \ + jit_movi(_jit, JIT_R0, V); \ + jit_movi(_jit, JIT_R1, O); \ + jit_stxr##T(_jit, JIT_R1, JIT_V0, JIT_R0); + +#define stx8(T, M, V) \ + stx(T, 3, (M##B3), V) \ + stx(T, 4, (M##B4), V) \ + stx(T, 5, (M##B5), V) \ + stx(T, 6, (M##B6), V) \ + stx(T, 7, (M##B7), V) \ + stx(T, 8, (M##B8), V) \ + stx(T, 9, (M##B9), V) \ + stx(T, 10, (M##B10), V) \ + stx(T, 11, (M##B11), V) \ + stx(T, 12, (M##B12), V) \ + stx(T, 13, (M##B13), V) \ + stx(T, 14, (M##B14), V) \ + stx(T, 15, (M##B15), V) \ + stx(T, 16, (M##B16), V) \ + stx(T, 17, (M##B17), V) \ + stx(T, 18, (M##B18), V) \ + stx(T, 19, (M##B19), V) \ + stx(T, 20, (M##B20), V) \ + stx(T, 21, (M##B21), V) \ + stx(T, 22, (M##B22), V) \ + stx(T, 23, (M##B23), V) \ + stx(T, 24, (M##B24), V) \ + stx(T, 25, (M##B25), V) \ + stx(T, 26, (M##B26), V) + +#define stx4(T, M, V) \ + stx(T, 2, (M##B2), V) \ + stx8(T, M, V) + +#define stx2(T, M, V) \ + stx(T, 1, (M##B1), V) \ + stx4(T, M, V) + +#define ldx(T, N, M, O, V) \ +{ \ + dump_args(T, N, M, O, V); \ + jit_movi(_jit, JIT_R0, 0); \ + jit_ldxi##T(_jit, JIT_R0, JIT_V0, O); \ + jit_reloc_t r = jit_beqi(_jit, JIT_R0, V); \ + jit_calli_0(_jit, abort); \ + jit_patch_here(_jit, r); \ +} + +#define ldx8(T, M, V) \ + ldx(T, 3, M, (M##B3), V) \ + ldx(T, 4, M, (M##B4), V) \ + ldx(T, 5, M, (M##B5), V) \ + ldx(T, 6, M, (M##B6), V) \ + ldx(T, 7, M, (M##B7), V) \ + ldx(T, 8, M, (M##B8), V) \ + ldx(T, 9, M, (M##B9), V) \ + ldx(T, 10, M, (M##B10), V) \ + ldx(T, 11, M, (M##B11), V) \ + ldx(T, 12, M, (M##B12), V) \ + ldx(T, 13, M, (M##B13), V) \ + ldx(T, 14, M, (M##B14), V) \ + ldx(T, 15, M, (M##B15), V) \ + ldx(T, 16, M, (M##B16), V) \ + ldx(T, 17, M, (M##B17), V) \ + ldx(T, 18, M, (M##B18), V) \ + ldx(T, 19, M, (M##B19), V) \ + ldx(T, 20, M, (M##B20), V) \ + ldx(T, 21, M, (M##B21), V) \ + ldx(T, 22, M, (M##B22), V) \ + ldx(T, 23, M, (M##B23), V) \ + ldx(T, 24, M, (M##B24), V) \ + ldx(T, 25, M, (M##B25), V) \ + ldx(T, 26, M, (M##B26), V) + +#define ldx4(T, M, V) \ + ldx(T, 2, M, (M##B2), V) \ + ldx8(T, M, V) + +#define ldx2(T, M, V) \ + ldx(T, 1, M, (M##B1), V) \ + ldx4(T, M, V) + +#define stf(T, N, O, V) \ + jit_movi##T(_jit, JIT_F0, V); \ + jit_movi(_jit, JIT_R0, O); \ + jit_stxr##T(_jit, JIT_R0, JIT_V0, JIT_F0); + +#define stf8(T, M, V) \ + stf(T, 3, (M##B3), V) \ + stf(T, 4, (M##B4), V) \ + stf(T, 5, (M##B5), V) \ + stf(T, 6, (M##B6), V) \ + stf(T, 7, (M##B7), V) \ + stf(T, 8, (M##B8), V) \ + stf(T, 9, (M##B9), V) \ + stf(T, 10, (M##B10), V) \ + stf(T, 11, (M##B11), V) \ + stf(T, 12, (M##B12), V) \ + stf(T, 13, (M##B13), V) \ + stf(T, 14, (M##B14), V) \ + stf(T, 15, (M##B15), V) \ + stf(T, 16, (M##B16), V) \ + stf(T, 17, (M##B17), V) \ + stf(T, 18, (M##B18), V) \ + stf(T, 19, (M##B19), V) \ + stf(T, 20, (M##B20), V) \ + stf(T, 21, (M##B21), V) \ + stf(T, 22, (M##B22), V) \ + stf(T, 23, (M##B23), V) \ + stf(T, 24, (M##B24), V) \ + stf(T, 25, (M##B25), V) \ + stf(T, 26, (M##B26), V) + +#define stf4(T, M, V) \ + stf(T, 2, (M##B2), V) \ + stf8(T, M, V) + +#define ldf(T, N, M, O, V) \ +{ \ + dump_args(T, N, M, O, V); \ + jit_movi##T(_jit, JIT_F0, 0); \ + jit_ldxi##T(_jit, JIT_F0, JIT_V0, O); \ + jit_movi##T(_jit, JIT_F1, V); \ + jit_reloc_t r = jit_beqr##T(_jit, JIT_F0, JIT_F1); \ + jit_calli_0(_jit, abort); \ + jit_patch_here(_jit, r); \ +} + +#define ldf8(T, M, V) \ + ldf(T, 3, M, (M##B3), V) \ + ldf(T, 4, M, (M##B4), V) \ + ldf(T, 5, M, (M##B5), V) \ + ldf(T, 6, M, (M##B6), V) \ + ldf(T, 7, M, (M##B7), V) \ + ldf(T, 8, M, (M##B8), V) \ + ldf(T, 9, M, (M##B9), V) \ + ldf(T, 10, M, (M##B10), V) \ + ldf(T, 11, M, (M##B11), V) \ + ldf(T, 12, M, (M##B12), V) \ + ldf(T, 13, M, (M##B13), V) \ + ldf(T, 14, M, (M##B14), V) \ + ldf(T, 15, M, (M##B15), V) \ + ldf(T, 16, M, (M##B16), V) \ + ldf(T, 17, M, (M##B17), V) \ + ldf(T, 18, M, (M##B18), V) \ + ldf(T, 19, M, (M##B19), V) \ + ldf(T, 20, M, (M##B20), V) \ + ldf(T, 21, M, (M##B21), V) \ + ldf(T, 22, M, (M##B22), V) \ + ldf(T, 23, M, (M##B23), V) \ + ldf(T, 24, M, (M##B24), V) \ + ldf(T, 25, M, (M##B25), V) \ + ldf(T, 26, M, (M##B26), V) +#define ldf4(T, M, V) \ + ldf(T, 2, M, (M##B2), V) \ + ldf8(T, M, V) + +#define ldst_c() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx2(_c, a, 0x5a) \ + ldx2(_c, a, 0x5a) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx2(_c, b, 0x5a) \ + ldx2(_c, b, 0x5a) + +#define ldst_uc() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx2(_c, a, 0x5a) \ + ldx2(_uc, a, 0x5a) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx2(_c, b, 0x5a) \ + ldx2(_uc, b, 0x5a) + +#define ldst_s() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx2(_s, a, 0x5a5a) \ + ldx2(_s, a, 0x5a5a) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx2(_s, b, 0x5a5a) \ + ldx2(_s, b, 0x5a5a) + +#define ldst_us() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx2(_s, a, 0x5a5a) \ + ldx2(_us, a, 0x5a5a) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx2(_s, b, 0x5a5a) \ + ldx2(_us, b, 0x5a5a) + +#define ldst_i() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx4(_i, a, 0x5a5a5a5a) \ + ldx4(_i, a, 0x5a5a5a5a) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx4(_i, b, 0x5a5a5a5a) \ + ldx4(_i, b, 0x5a5a5a5a) + +#define ldst_ui() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx4(_i, a, 0x5a5a5a5a) \ + ldx4(_ui, a, 0x5a5a5a5a) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx4(_i, b, 0x5a5a5a5a) \ + ldx4(_ui, b, 0x5a5a5a5a) + +#define ldst_l() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stx8(_l, a, 0x5a5a5a5a5a5a5a5a) \ + ldx8(_l, a, 0x5a5a5a5a5a5a5a5a) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stx8(_l, b, 0x5a5a5a5a5a5a5a5a) \ + ldx8(_l, b, 0x5a5a5a5a5a5a5a5a) + +#define ldst_f() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stf4(_f, a, 0.5) \ + ldf4(_f, a, 0.5) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stf4(_f, b, 0.5) \ + ldf4(_f, b, 0.5) + +#define ldst_d() \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)buf); \ + stf8(_d, a, 0.5) \ + ldf8(_d, a, 0.5) \ + reset(0xa5) \ + jit_movi(_jit, JIT_V0, (jit_imm_t)(buf + M64)); \ + stf8(_d, b, 0.5) \ + ldf8(_d, b, 0.5) + +static size_t +run_test(jit_state_t *_jit, uint8_t *arena_base, size_t arena_size) +{ + jit_begin(_jit, arena_base, arena_size); + size_t frame = jit_enter_jit_abi(_jit, 3, 0, 0); + + void (*function)(void); + + char *buf = malloc(M64 + 8); + ASSERT(buf); + + alu(add) + alu(sub) + alu(mul) + alu(div) + alu(rem) + lsh() + rsh() + alu(and) + alu(or) + alu(xor) + ldst_c() + ldst_uc() + ldst_s() + ldst_us() + ldst_i() +#if __WORDSIZE == 64 + ldst_ui() + ldst_l() +#endif + ldst_f() + ldst_d() + + jit_leave_jit_abi(_jit, 3, 0, frame); + jit_ret(_jit); + + size_t size = 0; + function = jit_end(_jit, &size); + + if (function) + (*function)(); + else { + free(buf); + return size; + } + + free(buf); + return 0; +} + +int main(int argc, char *argv[]) +{ + return main_compiler(argc, argv, run_test); +} |