Path: blob/master/thirdparty/pcre2/deps/sljit/sljit_src/sljitNativeMIPS_64.c
9913 views
/*
 *    Stack-less Just-In-Time compiler
 *
 *    Copyright Zoltan Herczeg ([email protected]). All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without modification, are
 * permitted provided that the following conditions are met:
 *
 *   1. Redistributions of source code must retain the above copyright notice, this list of
 *      conditions and the following disclaimer.
 *
 *   2. Redistributions in binary form must reproduce the above copyright notice, this list
 *      of conditions and the following disclaimer in the documentation and/or other materials
 *      provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
 * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
 * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/* mips 64-bit arch dependent functions. */

/*
 * Emits a copysign sequence: dst receives the bits of src1 with the sign bit
 * of src2.
 *
 * Both float registers are copied into TMP_REG1 / TMP_REG2, their XOR is
 * reduced to its top bit only (shift right, then left, by the same amount),
 * and that bit is XOR-ed back into the copy of src1, which flips the sign of
 * src1 exactly when the two signs differ. SELECT_OP picks the 64-bit or the
 * 32-bit form of each instruction (it is assumed to key on `op` / SLJIT_32;
 * the macro is defined outside this file).
 *
 * Returns SLJIT_SUCCESS, or whatever error FAIL_IF propagates from push_inst.
 */
static sljit_s32 emit_copysign(struct sljit_compiler *compiler, sljit_s32 op,
		sljit_s32 src1, sljit_s32 src2, sljit_s32 dst)
{
	/* TMP_REG1 = raw bits of src1, TMP_REG2 = raw bits of src2. */
	FAIL_IF(push_inst(compiler, SELECT_OP(DMFC1, MFC1) | T(TMP_REG1) | FS(src1), DR(TMP_REG1)));
	FAIL_IF(push_inst(compiler, SELECT_OP(DMFC1, MFC1) | T(TMP_REG2) | FS(src2), DR(TMP_REG2)));
	/* TMP_REG2 = src1 ^ src2; only its sign bit is of interest. */
	FAIL_IF(push_inst(compiler, XOR | S(TMP_REG2) | T(TMP_REG1) | D(TMP_REG2), DR(TMP_REG2)));
	/* Shift right then left to clear everything below the top bit
	   (DSRL32/DSLL32 with 31 shift by 63 per the MIPS64 ISA; SRL/SLL by 31). */
	FAIL_IF(push_inst(compiler, SELECT_OP(DSRL32, SRL) | T(TMP_REG2) | D(TMP_REG2) | SH_IMM(31), DR(TMP_REG2)));
	FAIL_IF(push_inst(compiler, SELECT_OP(DSLL32, SLL) | T(TMP_REG2) | D(TMP_REG2) | SH_IMM(31), DR(TMP_REG2)));
	/* Flip the sign of the src1 copy when the signs differed. */
	FAIL_IF(push_inst(compiler, XOR | S(TMP_REG1) | T(TMP_REG2) | D(TMP_REG1), DR(TMP_REG1)));
	FAIL_IF(push_inst(compiler, SELECT_OP(DMTC1, MTC1) | T(TMP_REG1) | FS(dst), MOVABLE_INS));
#if !defined(SLJIT_MIPS_REV) || SLJIT_MIPS_REV <= 1
	/* On old revisions an extra NOP follows the 64-bit move (DMTC1);
	   NOTE(review): presumably a coprocessor move hazard - confirm. */
	if (!(op & SLJIT_32))
		return push_inst(compiler, NOP, UNMOVABLE_INS);
#endif /* MIPS III */
	return SLJIT_SUCCESS;
}

/*
 * Loads the 64-bit constant `imm` into the register with absolute index
 * `dst_ar`, using a short instruction sequence chosen by the value:
 *
 *   - fits in 16 unsigned bits:          ORI from register 0
 *   - negative, not below SIMM_MIN:      ADDIU from register 0
 *   - fits in 32 signed bits:            LUI (+ ORI if the low half is non-zero)
 *   - otherwise:                         LUI/ORI for the leading bits, then one
 *                                        or two shift (+ ORI) steps for the rest
 *
 * Returns SLJIT_SUCCESS, or whatever error FAIL_IF propagates from push_inst.
 */
static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 dst_ar, sljit_sw imm)
{
	/* Number of low-order bits of imm not yet covered by the LUI/ORI pair. */
	sljit_s32 shift = 32;
	sljit_s32 shift2;
	/* Set when the normalization below works on ~imm (negative imm). */
	sljit_s32 inv = 0;
	sljit_ins ins;
	sljit_uw uimm;

	if (!(imm & ~0xffff))
		return push_inst(compiler, ORI | SA(0) | TA(dst_ar) | IMM(imm), dst_ar);

	if (imm < 0 && imm >= SIMM_MIN)
		return push_inst(compiler, ADDIU | SA(0) | TA(dst_ar) | IMM(imm), dst_ar);

	if (imm <= 0x7fffffffl && imm >= -0x80000000l) {
		FAIL_IF(push_inst(compiler, LUI | TA(dst_ar) | IMM(imm >> 16), dst_ar));
		return (imm & 0xffff) ? push_inst(compiler, ORI | SA(dst_ar) | TA(dst_ar) | IMM(imm), dst_ar) : SLJIT_SUCCESS;
	}

	/* Zero extended number. Negative values are complemented first so that
	   the leading-bit search below always looks for the highest set bit. */
	uimm = (sljit_uw)imm;
	if (imm < 0) {
		uimm = ~(sljit_uw)imm;
		inv = 1;
	}

	/* Normalize: shift uimm left until its two topmost bits are non-zero,
	   reducing `shift` by the same amount. uimm is non-zero here because
	   the 32-bit cases were handled above, so the loop terminates. */
	while (!(uimm & 0xff00000000000000l)) {
		shift -= 8;
		uimm <<= 8;
	}

	if (!(uimm & 0xf000000000000000l)) {
		shift -= 4;
		uimm <<= 4;
	}

	if (!(uimm & 0xc000000000000000l)) {
		shift -= 2;
		uimm <<= 2;
	}

	/* If the top bit itself is set, back off by one so bit 63 is clear and
	   bit 62 is set (see the assertion). */
	if ((sljit_sw)uimm < 0) {
		uimm >>= 1;
		shift += 1;
	}
	SLJIT_ASSERT(((uimm & 0xc000000000000000l) == 0x4000000000000000l) && (shift > 0) && (shift <= 32));

	/* Undo the complement taken for negative values. */
	if (inv)
		uimm = ~uimm;

	/* Load the upper 32 bits of the normalized value. */
	FAIL_IF(push_inst(compiler, LUI | TA(dst_ar) | IMM(uimm >> 48), dst_ar));
	if (uimm & 0x0000ffff00000000l)
		FAIL_IF(push_inst(compiler, ORI | SA(dst_ar) | TA(dst_ar) | IMM(uimm >> 32), dst_ar));

	/* Keep only the bits of imm that still have to be appended. */
	imm &= (1l << shift) - 1;
	if (!(imm & ~0xffff)) {
		/* The remainder fits in 16 bits: a single shift and an optional ORI. */
		ins = (shift == 32) ? DSLL32 : DSLL;
		if (shift < 32)
			ins |= SH_IMM(shift);
		FAIL_IF(push_inst(compiler, ins | TA(dst_ar) | DA(dst_ar), dst_ar));
		return !(imm & 0xffff) ? SLJIT_SUCCESS : push_inst(compiler, ORI | SA(dst_ar) | TA(dst_ar) | IMM(imm), dst_ar);
	}

	/* Two shifts need to be performed: move the low 32 bits of the
	   normalized value to the top and locate the next 16-bit chunk. */
	uimm <<= 32;
	shift2 = shift - 16;

	while (!(uimm & 0xf000000000000000l)) {
		shift2 -= 4;
		uimm <<= 4;
	}

	if (!(uimm & 0xc000000000000000l)) {
		shift2 -= 2;
		uimm <<= 2;
	}

	if (!(uimm & 0x8000000000000000l)) {
		shift2--;
		uimm <<= 1;
	}

	SLJIT_ASSERT((uimm & 0x8000000000000000l) && (shift2 > 0) && (shift2 <= 16));

	/* First shift + ORI inserts the middle chunk, the second shift makes
	   room for the final (at most 16-bit) remainder. */
	FAIL_IF(push_inst(compiler, DSLL | TA(dst_ar) | DA(dst_ar) | SH_IMM(shift - shift2), dst_ar));
	FAIL_IF(push_inst(compiler, ORI | SA(dst_ar) | TA(dst_ar) | IMM(uimm >> 48), dst_ar));
	FAIL_IF(push_inst(compiler, DSLL | TA(dst_ar) | DA(dst_ar) | SH_IMM(shift2), dst_ar));

	imm &= (1l << shift2) - 1;
	return !(imm & 0xffff) ? SLJIT_SUCCESS : push_inst(compiler, ORI | SA(dst_ar) | TA(dst_ar) | IMM(imm), dst_ar);
}

/*
 * Emits a fixed-length, six instruction sequence that loads `init_value`
 * into `dst`: LUI, ORI, DSLL 16, ORI, DSLL 16, ORI. The four 16-bit pieces of
 * the value end up in the immediate fields of instructions 0, 1, 3 and 5,
 * which is the layout sljit_set_jump_addr() patches.
 * NOTE(review): this relies on IMM() keeping only the low 16 bits of its
 * argument - confirm against the macro definition.
 */
static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 dst, sljit_sw init_value)
{
	FAIL_IF(push_inst(compiler, LUI | T(dst) | IMM(init_value >> 48), DR(dst)));
	FAIL_IF(push_inst(compiler, ORI | S(dst) | T(dst) | IMM(init_value >> 32), DR(dst)));
	FAIL_IF(push_inst(compiler, DSLL | T(dst) | D(dst) | SH_IMM(16), DR(dst)));
	FAIL_IF(push_inst(compiler, ORI | S(dst) | T(dst) | IMM(init_value >> 16), DR(dst)));
	FAIL_IF(push_inst(compiler, DSLL | T(dst) | D(dst) | SH_IMM(16), DR(dst)));
	return push_inst(compiler, ORI | S(dst) | T(dst) | IMM(init_value), DR(dst));
}

/*
 * Sets the float register `freg` to the 64-bit floating point constant
 * `value`.
 *
 * The bit pattern of `value` is read through a union. An all-zero pattern is
 * moved directly from register 0; any other pattern is first materialized in
 * TMP_REG1 with load_immediate(). Both paths finish with DMTC1, followed by a
 * NOP when SLJIT_MIPS_REV is undefined or <= 1.
 */
SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fset64(struct sljit_compiler *compiler,
		sljit_s32 freg, sljit_f64 value)
{
	/* Reinterprets the double as a machine word without a pointer cast. */
	union {
		sljit_sw imm;
		sljit_f64 value;
	} u;

	CHECK_ERROR();
	CHECK(check_sljit_emit_fset64(compiler, freg, value));

	u.value = value;

	/* All bits zero: no constant load is needed, move from register 0. */
	if (u.imm == 0) {
		FAIL_IF(push_inst(compiler, DMTC1 | TA(0) | FS(freg), MOVABLE_INS));
#if !defined(SLJIT_MIPS_REV) || SLJIT_MIPS_REV <= 1
		FAIL_IF(push_inst(compiler, NOP, UNMOVABLE_INS));
#endif /* MIPS III */
		return SLJIT_SUCCESS;
	}

	FAIL_IF(load_immediate(compiler, DR(TMP_REG1), u.imm));
	FAIL_IF(push_inst(compiler, DMTC1 | T(TMP_REG1) | FS(freg), MOVABLE_INS));
#if !defined(SLJIT_MIPS_REV) || SLJIT_MIPS_REV <= 1
	FAIL_IF(push_inst(compiler, NOP, UNMOVABLE_INS));
#endif /* MIPS III */
	return SLJIT_SUCCESS;
}

/*
 * Copies raw bits between the general purpose register `reg` and the float
 * register `freg`.
 *
 * SLJIT_COPY_TO_F64 moves reg -> freg (DMTC1 / MTC1); every other opcode
 * moves freg -> reg (DMFC1 / MFC1). As in emit_copysign(), a NOP is appended
 * after the 64-bit form when SLJIT_MIPS_REV is undefined or <= 1.
 */
SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fcopy(struct sljit_compiler *compiler, sljit_s32 op,
		sljit_s32 freg, sljit_s32 reg)
{
	sljit_ins inst;

	CHECK_ERROR();
	CHECK(check_sljit_emit_fcopy(compiler, op, freg, reg));

	/* Register operand fields shared by both directions. */
	inst = T(reg) | FS(freg);

	if (GET_OPCODE(op) == SLJIT_COPY_TO_F64)
		FAIL_IF(push_inst(compiler, SELECT_OP(DMTC1, MTC1) | inst, MOVABLE_INS));
	else
		FAIL_IF(push_inst(compiler, SELECT_OP(DMFC1, MFC1) | inst, DR(reg)));

#if !defined(SLJIT_MIPS_REV) || SLJIT_MIPS_REV <= 1
	if (!(op & SLJIT_32))
		return push_inst(compiler, NOP, UNMOVABLE_INS);
#endif /* MIPS III */
	return SLJIT_SUCCESS;
}

/*
 * Rewrites the target of an already generated six instruction constant load
 * located at `addr` so that it produces `new_target`.
 *
 * Only the low 16 bits (the immediate field) of instructions 0, 1, 3 and 5
 * are replaced; instructions 2 and 4 are left untouched (they are the shifts
 * in the sequence produced by emit_const()). The write is bracketed by
 * SLJIT_UPDATE_WX_FLAGS and followed by a cache flush of the executable view
 * of the same range.
 */
SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
{
	sljit_ins *inst = (sljit_ins *)addr;
	/* Silences unused-parameter warnings in builds where the macros below
	   do not reference executable_offset (assumption - TODO confirm). */
	SLJIT_UNUSED_ARG(executable_offset);

	SLJIT_UPDATE_WX_FLAGS(inst, inst + 6, 0);
	inst[0] = (inst[0] & 0xffff0000) | ((sljit_ins)(new_target >> 48) & 0xffff);
	inst[1] = (inst[1] & 0xffff0000) | ((sljit_ins)(new_target >> 32) & 0xffff);
	inst[3] = (inst[3] & 0xffff0000) | ((sljit_ins)(new_target >> 16) & 0xffff);
	inst[5] = (inst[5] & 0xffff0000) | ((sljit_ins)new_target & 0xffff);
	SLJIT_UPDATE_WX_FLAGS(inst, inst + 6, 1);
	inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
	SLJIT_CACHE_FLUSH(inst, inst + 6);
}

/*
 * Rewrites a patchable constant. Constants and jump targets share the same
 * six instruction layout, so this simply forwards to sljit_set_jump_addr().
 */
SLJIT_API_FUNC_ATTRIBUTE void sljit_set_const(sljit_uw addr, sljit_sw new_constant, sljit_sw executable_offset)
{
	sljit_set_jump_addr(addr, (sljit_uw)new_constant, executable_offset);
}

/*
 * Generates the register moves that rearrange call arguments before a call.
 *
 * `arg_types` is the packed argument type list; its lowest slot is skipped
 * (presumably the return type - confirm against the SLJIT_ARG_* definitions).
 * `*ins_ptr` carries one pending instruction in and out: on entry it may hold
 * an instruction the caller has not pushed yet, on return it holds the last
 * instruction generated here (or the incoming one if nothing was generated).
 * The callers push that instruction right after the jump instruction.
 *
 * Returns SLJIT_SUCCESS, or whatever error FAIL_IF propagates from push_inst.
 */
static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_ins *ins_ptr)
{
	sljit_s32 arg_count = 0;
	sljit_s32 word_arg_count = 0;
	sljit_s32 float_arg_count = 0;
	sljit_s32 types = 0;
	sljit_ins prev_ins = *ins_ptr;
	sljit_ins ins = NOP;

	/* The explicit DA(4) and TMP_FREG1 destinations below depend on these
	   register mappings. */
	SLJIT_ASSERT(reg_map[TMP_REG2] == 4 && freg_map[TMP_FREG1] == 12);

	arg_types >>= SLJIT_ARG_SHIFT;

	/* First pass: count the arguments per class and build `types`, the
	   same list in reverse order, so the second pass visits the last
	   argument first. */
	while (arg_types) {
		types = (types << SLJIT_ARG_SHIFT) | (arg_types & SLJIT_ARG_MASK);

		switch (arg_types & SLJIT_ARG_MASK) {
		case SLJIT_ARG_TYPE_F64:
		case SLJIT_ARG_TYPE_F32:
			arg_count++;
			float_arg_count++;
			break;
		default:
			arg_count++;
			word_arg_count++;
			break;
		}

		arg_types >>= SLJIT_ARG_SHIFT;
	}

	/* Second pass, last argument to first. An argument needs a move when
	   its overall position (arg_count) differs from its position within
	   its own class; the very first argument (arg_count == 1) is always
	   moved, to TMP_FREG1 or to absolute register 4. */
	while (types) {
		switch (types & SLJIT_ARG_MASK) {
		case SLJIT_ARG_TYPE_F64:
			if (arg_count != float_arg_count)
				ins = MOV_fmt(FMT_D) | FS(float_arg_count) | FD(arg_count);
			else if (arg_count == 1)
				ins = MOV_fmt(FMT_D) | FS(SLJIT_FR0) | FD(TMP_FREG1);
			arg_count--;
			float_arg_count--;
			break;
		case SLJIT_ARG_TYPE_F32:
			if (arg_count != float_arg_count)
				ins = MOV_fmt(FMT_S) | FS(float_arg_count) | FD(arg_count);
			else if (arg_count == 1)
				ins = MOV_fmt(FMT_S) | FS(SLJIT_FR0) | FD(TMP_FREG1);
			arg_count--;
			float_arg_count--;
			break;
		default:
			if (arg_count != word_arg_count)
				ins = DADDU | S(word_arg_count) | TA(0) | D(arg_count);
			else if (arg_count == 1)
				ins = DADDU | S(SLJIT_R0) | TA(0) | DA(4);
			arg_count--;
			word_arg_count--;
			break;
		}

		/* Emission is delayed by one instruction: the previously
		   generated move is pushed only once a newer one exists, so
		   the newest one always stays pending in prev_ins. */
		if (ins != NOP) {
			if (prev_ins != NOP)
				FAIL_IF(push_inst(compiler, prev_ins, MOVABLE_INS));
			prev_ins = ins;
			ins = NOP;
		}

		types >>= SLJIT_ARG_SHIFT;
	}

	*ins_ptr = prev_ins;

	return SLJIT_SUCCESS;
}

/*
 * Emits a call (or, with SLJIT_CALL_RETURN, a tail call) to a target that is
 * filled in later through the returned jump record.
 *
 * The jump instruction goes through PIC_ADDR_REG (JALR for calls, JR for
 * tail calls). The pending instruction from stack frame release / argument
 * setup is pushed immediately after it, and six further instruction words
 * are reserved in compiler->size for the code that loads the target address.
 *
 * Returns the jump record, or NULL through CHECK_ERROR_PTR / PTR_FAIL_IF on
 * failure (assumption based on the macro names - defined outside this file).
 */
SLJIT_API_FUNC_ATTRIBUTE struct sljit_jump* sljit_emit_call(struct sljit_compiler *compiler, sljit_s32 type,
		sljit_s32 arg_types)
{
	struct sljit_jump *jump;
	/* Instruction to be placed right after the jump; NOP if none. */
	sljit_ins ins = NOP;

	CHECK_ERROR_PTR();
	CHECK_PTR(check_sljit_emit_call(compiler, type, arg_types));

	jump = (struct sljit_jump*)ensure_abuf(compiler, sizeof(struct sljit_jump));
	PTR_FAIL_IF(!jump);
	set_jump(jump, compiler, type & SLJIT_REWRITABLE_JUMP);

	if (type & SLJIT_CALL_RETURN)
		PTR_FAIL_IF(emit_stack_frame_release(compiler, 0, &ins));

	/* SLJIT_CALL_REG_ARG calls need no argument rearrangement. */
	if ((type & 0xff) != SLJIT_CALL_REG_ARG)
		PTR_FAIL_IF(call_with_args(compiler, arg_types, &ins));

	SLJIT_ASSERT(DR(PIC_ADDR_REG) == 25);

	/* With nothing pending and a movable previous instruction, flag the
	   jump as IS_MOVABLE. */
	if (ins == NOP && compiler->delay_slot != UNMOVABLE_INS)
		jump->flags |= IS_MOVABLE;

	if (!(type & SLJIT_CALL_RETURN)) {
		jump->flags |= IS_JAL;

		if ((type & 0xff) != SLJIT_CALL_REG_ARG)
			jump->flags |= IS_CALL;

		PTR_FAIL_IF(push_inst(compiler, JALR | S(PIC_ADDR_REG) | DA(RETURN_ADDR_REG), UNMOVABLE_INS));
	} else
		PTR_FAIL_IF(push_inst(compiler, JR | S(PIC_ADDR_REG), UNMOVABLE_INS));

	/* Record the position right after the jump instruction, then push the
	   pending instruction (or a NOP) into that slot. */
	jump->addr = compiler->size;
	PTR_FAIL_IF(push_inst(compiler, ins, UNMOVABLE_INS));

	/* Maximum number of instructions required for generating a constant. */
	compiler->size += 6;
	return jump;
}

/*
 * Emits an indirect call (or, with SLJIT_CALL_RETURN, a tail call) to the
 * address given by `src` / `srcw`.
 *
 * SLJIT_CALL_REG_ARG calls are forwarded to sljit_emit_ijump() after an
 * optional stack frame release. All other calls load the target into
 * PIC_ADDR_REG, rearrange the arguments with call_with_args() and emit
 * JALR / JR followed by the pending instruction.
 *
 * Returns SLJIT_SUCCESS, or whatever error FAIL_IF propagates.
 */
SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_icall(struct sljit_compiler *compiler, sljit_s32 type,
		sljit_s32 arg_types,
		sljit_s32 src, sljit_sw srcw)
{
	/* Instruction to be placed right after the jump; NOP if none. */
	sljit_ins ins = NOP;

	CHECK_ERROR();
	CHECK(check_sljit_emit_icall(compiler, type, arg_types, src, srcw));

	/* A memory operand is loaded into PIC_ADDR_REG first. */
	if (src & SLJIT_MEM) {
		ADJUST_LOCAL_OFFSET(src, srcw);
		FAIL_IF(emit_op_mem(compiler, WORD_DATA | LOAD_DATA, DR(PIC_ADDR_REG), src, srcw));
		src = PIC_ADDR_REG;
		srcw = 0;
	}

	if ((type & 0xff) == SLJIT_CALL_REG_ARG) {
		if (type & SLJIT_CALL_RETURN) {
			/* Copy the target out of a saved register before the
			   stack frame is released (presumably because the
			   release restores that register - confirm). */
			if (src >= SLJIT_FIRST_SAVED_REG && src <= (SLJIT_S0 - SLJIT_KEPT_SAVEDS_COUNT(compiler->options))) {
				FAIL_IF(push_inst(compiler, DADDU | S(src) | TA(0) | D(PIC_ADDR_REG), DR(PIC_ADDR_REG)));
				src = PIC_ADDR_REG;
				srcw = 0;
			}

			FAIL_IF(emit_stack_frame_release(compiler, 0, &ins));

			/* sljit_emit_ijump() takes no pending instruction, so
			   push it here. */
			if (ins != NOP)
				FAIL_IF(push_inst(compiler, ins, MOVABLE_INS));
		}

		SLJIT_SKIP_CHECKS(compiler);
		return sljit_emit_ijump(compiler, type, src, srcw);
	}

	SLJIT_ASSERT(DR(PIC_ADDR_REG) == 25 && PIC_ADDR_REG == TMP_REG1);

	/* Get the call target into PIC_ADDR_REG unless it is already there. */
	if (src == SLJIT_IMM)
		FAIL_IF(load_immediate(compiler, DR(PIC_ADDR_REG), srcw));
	else if (src != PIC_ADDR_REG)
		FAIL_IF(push_inst(compiler, DADDU | S(src) | TA(0) | D(PIC_ADDR_REG), DR(PIC_ADDR_REG)));

	if (type & SLJIT_CALL_RETURN)
		FAIL_IF(emit_stack_frame_release(compiler, 0, &ins));

	FAIL_IF(call_with_args(compiler, arg_types, &ins));

	/* Register input. */
	if (!(type & SLJIT_CALL_RETURN))
		FAIL_IF(push_inst(compiler, JALR | S(PIC_ADDR_REG) | DA(RETURN_ADDR_REG), UNMOVABLE_INS));
	else
		FAIL_IF(push_inst(compiler, JR | S(PIC_ADDR_REG), UNMOVABLE_INS));
	/* The pending instruction (or a NOP) goes right after the jump. */
	return push_inst(compiler, ins, UNMOVABLE_INS);
}