/* Path: blob/master/thirdparty/pcre2/deps/sljit/sljit_src/sljitNativePPC_64.c */
/* 9913 views */
/*1* Stack-less Just-In-Time compiler2*3* Copyright Zoltan Herczeg ([email protected]). All rights reserved.4*5* Redistribution and use in source and binary forms, with or without modification, are6* permitted provided that the following conditions are met:7*8* 1. Redistributions of source code must retain the above copyright notice, this list of9* conditions and the following disclaimer.10*11* 2. Redistributions in binary form must reproduce the above copyright notice, this list12* of conditions and the following disclaimer in the documentation and/or other materials13* provided with the distribution.14*15* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY16* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES17* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT18* SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,19* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED20* TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR21* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN22* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN23* ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.24*/2526/* ppc 64-bit arch dependent functions. */2728#if defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)29#define ASM_SLJIT_CLZ(src, dst) \30__asm__ volatile ( "cntlzd %0, %1" : "=r"(dst) : "r"(src) )31#elif defined(__xlc__)32#error "Please enable GCC syntax for inline assembly statements"33#else34#error "Must implement count leading zeroes"35#endif3637/* Computes SLDI(63 - shift). 
*/38#define PUSH_SLDI_NEG(reg, shift) \39push_inst(compiler, RLDICR | S(reg) | A(reg) | RLDI_SH(63 - shift) | RLDI_ME(shift))4041static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw imm)42{43sljit_uw tmp;44sljit_uw shift;45sljit_uw tmp2;46sljit_uw shift2;4748if (imm <= SIMM_MAX && imm >= SIMM_MIN)49return push_inst(compiler, ADDI | D(reg) | A(0) | IMM(imm));5051if (((sljit_uw)imm >> 16) == 0)52return push_inst(compiler, ORI | S(TMP_ZERO) | A(reg) | IMM(imm));5354if (imm <= 0x7fffffffl && imm >= -0x80000000l) {55FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 16)));56return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;57}5859if (((sljit_uw)imm >> 32) == 0) {60FAIL_IF(push_inst(compiler, ORIS | S(TMP_ZERO) | A(reg) | IMM(imm >> 16)));61return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;62}6364/* Count leading zeroes. */65tmp = (sljit_uw)((imm >= 0) ? imm : ~imm);66ASM_SLJIT_CLZ(tmp, shift);67SLJIT_ASSERT(shift > 0);68shift--;69tmp = ((sljit_uw)imm << shift);7071if ((tmp & ~0xffff000000000000ul) == 0) {72FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));73shift += 15;74return PUSH_SLDI_NEG(reg, shift);75}7677if ((tmp & ~0xffffffff00000000ul) == 0) {78FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));79FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp >> 32)));80shift += 31;81return PUSH_SLDI_NEG(reg, shift);82}8384/* Cut out the 16 bit from immediate. 
*/85shift += 15;86tmp2 = (sljit_uw)imm & (((sljit_uw)1 << (63 - shift)) - 1);8788if (tmp2 <= 0xffff) {89FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));90FAIL_IF(PUSH_SLDI_NEG(reg, shift));91return push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)tmp2);92}9394if (tmp2 <= 0xffffffff) {95FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));96FAIL_IF(PUSH_SLDI_NEG(reg, shift));97FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 16)));98return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp2)) : SLJIT_SUCCESS;99}100101ASM_SLJIT_CLZ(tmp2, shift2);102tmp2 <<= shift2;103104if ((tmp2 & ~0xffff000000000000ul) == 0) {105FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | (sljit_ins)(tmp >> 48)));106shift2 += 15;107shift += (63 - shift2);108FAIL_IF(PUSH_SLDI_NEG(reg, shift));109FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | (sljit_ins)(tmp2 >> 48)));110return PUSH_SLDI_NEG(reg, shift2);111}112113/* The general version. */114FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | (sljit_ins)((sljit_uw)imm >> 48)));115FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm >> 32)));116FAIL_IF(PUSH_SLDI_NEG(reg, 31));117FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(imm >> 16)));118return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm));119}120121#undef PUSH_SLDI_NEG122123#define CLRLDI(dst, src, n) \124(RLDICL | S(src) | A(dst) | RLDI_SH(0) | RLDI_MB(n))125126/* Sign extension for integer operations. 
*/127#define UN_EXTS() \128if ((flags & (ALT_SIGN_EXT | REG2_SOURCE)) == (ALT_SIGN_EXT | REG2_SOURCE)) { \129FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \130src2 = TMP_REG2; \131}132133#define BIN_EXTS() \134if (flags & ALT_SIGN_EXT) { \135if (flags & REG1_SOURCE) { \136FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \137src1 = TMP_REG1; \138} \139if (flags & REG2_SOURCE) { \140FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \141src2 = TMP_REG2; \142} \143}144145#define BIN_IMM_EXTS() \146if ((flags & (ALT_SIGN_EXT | REG1_SOURCE)) == (ALT_SIGN_EXT | REG1_SOURCE)) { \147FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \148src1 = TMP_REG1; \149}150151static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,152sljit_s32 dst, sljit_s32 src1, sljit_s32 src2)153{154sljit_u32 imm;155156switch (op) {157case SLJIT_MOV:158case SLJIT_MOV_P:159SLJIT_ASSERT(src1 == TMP_REG1);160if (dst != src2)161return push_inst(compiler, OR | S(src2) | A(dst) | B(src2));162return SLJIT_SUCCESS;163164case SLJIT_MOV_U32:165case SLJIT_MOV_S32:166SLJIT_ASSERT(src1 == TMP_REG1);167if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {168if (op == SLJIT_MOV_S32)169return push_inst(compiler, EXTSW | S(src2) | A(dst));170return push_inst(compiler, CLRLDI(dst, src2, 32));171}172else {173SLJIT_ASSERT(dst == src2);174}175return SLJIT_SUCCESS;176177case SLJIT_MOV_U8:178case SLJIT_MOV_S8:179SLJIT_ASSERT(src1 == TMP_REG1);180if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {181if (op == SLJIT_MOV_S8)182return push_inst(compiler, EXTSB | S(src2) | A(dst));183return push_inst(compiler, CLRLDI(dst, src2, 56));184}185else if ((flags & REG_DEST) && op == SLJIT_MOV_S8)186return push_inst(compiler, EXTSB | S(src2) | A(dst));187else {188SLJIT_ASSERT(dst == src2);189}190return SLJIT_SUCCESS;191192case SLJIT_MOV_U16:193case SLJIT_MOV_S16:194SLJIT_ASSERT(src1 == TMP_REG1);195if 
((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {196if (op == SLJIT_MOV_S16)197return push_inst(compiler, EXTSH | S(src2) | A(dst));198return push_inst(compiler, CLRLDI(dst, src2, 48));199}200else {201SLJIT_ASSERT(dst == src2);202}203return SLJIT_SUCCESS;204205case SLJIT_CLZ:206SLJIT_ASSERT(src1 == TMP_REG1);207return push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(src2) | A(dst));208209case SLJIT_CTZ:210SLJIT_ASSERT(src1 == TMP_REG1);211FAIL_IF(push_inst(compiler, NEG | D(TMP_REG1) | A(src2)));212FAIL_IF(push_inst(compiler, AND | S(src2) | A(dst) | B(TMP_REG1)));213FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? CNTLZW : CNTLZD) | S(dst) | A(dst)));214FAIL_IF(push_inst(compiler, ADDI | D(TMP_REG1) | A(dst) | IMM((flags & ALT_FORM1) ? -32 : -64)));215/* The highest bits are set, if dst < bit width, zero otherwise. */216FAIL_IF(push_inst(compiler, ((flags & ALT_FORM1) ? SRWI(27) : SRDI(58)) | S(TMP_REG1) | A(TMP_REG1)));217return push_inst(compiler, XOR | S(dst) | A(dst) | B(TMP_REG1));218219case SLJIT_ADD:220if (flags & ALT_FORM1) {221if (flags & ALT_SIGN_EXT) {222FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));223src1 = TMP_REG1;224FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));225src2 = TMP_REG2;226}227/* Setting XER SO is not enough, CR SO is also needed. */228FAIL_IF(push_inst(compiler, ADD | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2)));229if (flags & ALT_SIGN_EXT)230return push_inst(compiler, SRDI(32) | S(dst) | A(dst));231return SLJIT_SUCCESS;232}233234if (flags & ALT_FORM2) {235/* Flags does not set: BIN_IMM_EXTS unnecessary. 
*/236SLJIT_ASSERT(src2 == TMP_REG2);237238if (flags & ALT_FORM3)239return push_inst(compiler, ADDIS | D(dst) | A(src1) | compiler->imm);240241imm = compiler->imm;242243if (flags & ALT_FORM4) {244FAIL_IF(push_inst(compiler, ADDIS | D(dst) | A(src1) | (((imm >> 16) & 0xffff) + ((imm >> 15) & 0x1))));245src1 = dst;246}247248return push_inst(compiler, ADDI | D(dst) | A(src1) | (imm & 0xffff));249}250if (flags & ALT_FORM3) {251SLJIT_ASSERT(src2 == TMP_REG2);252BIN_IMM_EXTS();253return push_inst(compiler, ADDIC | D(dst) | A(src1) | compiler->imm);254}255if (flags & ALT_FORM4) {256if (flags & ALT_FORM5)257FAIL_IF(push_inst(compiler, ADDI | D(dst) | A(src1) | compiler->imm));258else259FAIL_IF(push_inst(compiler, ADD | D(dst) | A(src1) | B(src2)));260return push_inst(compiler, CMPI | A(dst) | 0);261}262if (!(flags & ALT_SET_FLAGS))263return push_inst(compiler, ADD | D(dst) | A(src1) | B(src2));264BIN_EXTS();265if (flags & ALT_FORM5)266return push_inst(compiler, ADDC | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2));267return push_inst(compiler, ADD | RC(flags) | D(dst) | A(src1) | B(src2));268269case SLJIT_ADDC:270BIN_EXTS();271return push_inst(compiler, ADDE | D(dst) | A(src1) | B(src2));272273case SLJIT_SUB:274if (flags & ALT_FORM1) {275if (flags & ALT_FORM2) {276FAIL_IF(push_inst(compiler, CMPLI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));277if (!(flags & ALT_FORM3))278return SLJIT_SUCCESS;279return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));280}281FAIL_IF(push_inst(compiler, CMPL | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));282if (!(flags & ALT_FORM3))283return SLJIT_SUCCESS;284return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));285}286287if (flags & ALT_FORM2) {288if (flags & ALT_FORM3) {289FAIL_IF(push_inst(compiler, CMPI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 
0 : 1)) | A(src1) | compiler->imm));290if (!(flags & ALT_FORM4))291return SLJIT_SUCCESS;292return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));293}294FAIL_IF(push_inst(compiler, CMP | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));295if (!(flags & ALT_FORM4))296return SLJIT_SUCCESS;297return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));298}299300if (flags & ALT_FORM3) {301if (flags & ALT_SIGN_EXT) {302if (src1 != TMP_ZERO) {303FAIL_IF(push_inst(compiler, SLDI(32) | S(src1) | A(TMP_REG1)));304src1 = TMP_REG1;305}306if (src2 != TMP_ZERO) {307FAIL_IF(push_inst(compiler, SLDI(32) | S(src2) | A(TMP_REG2)));308src2 = TMP_REG2;309}310}311312/* Setting XER SO is not enough, CR SO is also needed. */313if (src1 != TMP_ZERO)314FAIL_IF(push_inst(compiler, SUBF | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1)));315else316FAIL_IF(push_inst(compiler, NEG | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2)));317318if (flags & ALT_SIGN_EXT)319return push_inst(compiler, SRDI(32) | S(dst) | A(dst));320return SLJIT_SUCCESS;321}322323if (flags & ALT_FORM4) {324/* Flags does not set: BIN_IMM_EXTS unnecessary. 
*/325SLJIT_ASSERT(src2 == TMP_REG2);326return push_inst(compiler, SUBFIC | D(dst) | A(src1) | compiler->imm);327}328329if (!(flags & ALT_SET_FLAGS)) {330SLJIT_ASSERT(src1 != TMP_ZERO);331return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));332}333334BIN_EXTS();335if (flags & ALT_FORM5)336return push_inst(compiler, SUBFC | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));337338if (src1 != TMP_ZERO)339return push_inst(compiler, SUBF | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));340return push_inst(compiler, NEG | RC(ALT_SET_FLAGS) | D(dst) | A(src2));341342case SLJIT_SUBC:343BIN_EXTS();344return push_inst(compiler, SUBFE | D(dst) | A(src2) | B(src1));345346case SLJIT_MUL:347if (flags & ALT_FORM1) {348SLJIT_ASSERT(src2 == TMP_REG2);349return push_inst(compiler, MULLI | D(dst) | A(src1) | compiler->imm);350}351BIN_EXTS();352if (flags & ALT_FORM2)353return push_inst(compiler, MULLW | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));354return push_inst(compiler, MULLD | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));355356case SLJIT_AND:357if (flags & ALT_FORM1) {358SLJIT_ASSERT(src2 == TMP_REG2);359return push_inst(compiler, ANDI | S(src1) | A(dst) | compiler->imm);360}361if (flags & ALT_FORM2) {362SLJIT_ASSERT(src2 == TMP_REG2);363return push_inst(compiler, ANDIS | S(src1) | A(dst) | compiler->imm);364}365return push_inst(compiler, AND | RC(flags) | S(src1) | A(dst) | B(src2));366367case SLJIT_OR:368if (flags & ALT_FORM1) {369SLJIT_ASSERT(src2 == TMP_REG2);370return push_inst(compiler, ORI | S(src1) | A(dst) | compiler->imm);371}372if (flags & ALT_FORM2) {373SLJIT_ASSERT(src2 == TMP_REG2);374return push_inst(compiler, ORIS | S(src1) | A(dst) | compiler->imm);375}376if (flags & ALT_FORM3) {377SLJIT_ASSERT(src2 == TMP_REG2);378imm = compiler->imm;379380FAIL_IF(push_inst(compiler, ORI | S(src1) | A(dst) | IMM(imm)));381return push_inst(compiler, ORIS | S(dst) | A(dst) | IMM(imm >> 16));382}383return push_inst(compiler, OR | RC(flags) | S(src1) | A(dst) 
| B(src2));384385case SLJIT_XOR:386if (flags & ALT_FORM1) {387SLJIT_ASSERT(src2 == TMP_REG2);388return push_inst(compiler, XORI | S(src1) | A(dst) | compiler->imm);389}390if (flags & ALT_FORM2) {391SLJIT_ASSERT(src2 == TMP_REG2);392return push_inst(compiler, XORIS | S(src1) | A(dst) | compiler->imm);393}394if (flags & ALT_FORM3) {395SLJIT_ASSERT(src2 == TMP_REG2);396imm = compiler->imm;397398FAIL_IF(push_inst(compiler, XORI | S(src1) | A(dst) | IMM(imm)));399return push_inst(compiler, XORIS | S(dst) | A(dst) | IMM(imm >> 16));400}401if (flags & ALT_FORM4) {402SLJIT_ASSERT(src1 == TMP_REG1);403UN_EXTS();404return push_inst(compiler, NOR | RC(flags) | S(src2) | A(dst) | B(src2));405}406return push_inst(compiler, XOR | RC(flags) | S(src1) | A(dst) | B(src2));407408case SLJIT_SHL:409case SLJIT_MSHL:410if (flags & ALT_FORM1) {411SLJIT_ASSERT(src2 == TMP_REG2);412imm = compiler->imm;413414if (flags & ALT_FORM2) {415imm &= 0x1f;416return push_inst(compiler, SLWI(imm) | RC(flags) | S(src1) | A(dst));417}418419imm &= 0x3f;420return push_inst(compiler, SLDI(imm) | RC(flags) | S(src1) | A(dst));421}422423if (op == SLJIT_MSHL) {424FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));425src2 = TMP_REG2;426}427428return push_inst(compiler, ((flags & ALT_FORM2) ? SLW : SLD) | RC(flags) | S(src1) | A(dst) | B(src2));429430case SLJIT_LSHR:431case SLJIT_MLSHR:432if (flags & ALT_FORM1) {433SLJIT_ASSERT(src2 == TMP_REG2);434imm = compiler->imm;435436if (flags & ALT_FORM2) {437imm &= 0x1f;438/* Since imm can be 0, SRWI() cannot be used. */439return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | RLWI_SH((32 - imm) & 0x1f) | RLWI_MBE(imm, 31));440}441442imm &= 0x3f;443/* Since imm can be 0, SRDI() cannot be used. 
*/444return push_inst(compiler, RLDICL | RC(flags) | S(src1) | A(dst) | RLDI_SH((64 - imm) & 0x3f) | RLDI_MB(imm));445}446447if (op == SLJIT_MLSHR) {448FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));449src2 = TMP_REG2;450}451452return push_inst(compiler, ((flags & ALT_FORM2) ? SRW : SRD) | RC(flags) | S(src1) | A(dst) | B(src2));453454case SLJIT_ASHR:455case SLJIT_MASHR:456if (flags & ALT_FORM1) {457SLJIT_ASSERT(src2 == TMP_REG2);458imm = compiler->imm;459460if (flags & ALT_FORM2) {461imm &= 0x1f;462return push_inst(compiler, SRAWI | RC(flags) | S(src1) | A(dst) | (imm << 11));463}464465imm &= 0x3f;466return push_inst(compiler, SRADI | RC(flags) | S(src1) | A(dst) | RLDI_SH(imm));467}468469if (op == SLJIT_MASHR) {470FAIL_IF(push_inst(compiler, ANDI | S(src2) | A(TMP_REG2) | ((flags & ALT_FORM2) ? 0x1f : 0x3f)));471src2 = TMP_REG2;472}473474return push_inst(compiler, ((flags & ALT_FORM2) ? SRAW : SRAD) | RC(flags) | S(src1) | A(dst) | B(src2));475476case SLJIT_ROTL:477case SLJIT_ROTR:478if (flags & ALT_FORM1) {479SLJIT_ASSERT(src2 == TMP_REG2);480imm = compiler->imm;481482if (op == SLJIT_ROTR)483imm = (sljit_u32)(-(sljit_s32)imm);484485if (flags & ALT_FORM2) {486imm &= 0x1f;487return push_inst(compiler, RLWINM | S(src1) | A(dst) | RLWI_SH(imm) | RLWI_MBE(0, 31));488}489490imm &= 0x3f;491return push_inst(compiler, RLDICL | S(src1) | A(dst) | RLDI_SH(imm));492}493494if (op == SLJIT_ROTR) {495FAIL_IF(push_inst(compiler, SUBFIC | D(TMP_REG2) | A(src2) | 0));496src2 = TMP_REG2;497}498499return push_inst(compiler, ((flags & ALT_FORM2) ? 
(RLWNM | RLWI_MBE(0, 31)) : (RLDCL | RLDI_MB(0))) | S(src1) | A(dst) | B(src2));500}501502SLJIT_UNREACHABLE();503return SLJIT_SUCCESS;504}505506static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_s32 *src)507{508sljit_s32 arg_count = 0;509sljit_s32 word_arg_count = 0;510sljit_s32 types = 0;511sljit_s32 reg = 0;512513if (src)514reg = *src & REG_MASK;515516arg_types >>= SLJIT_ARG_SHIFT;517518while (arg_types) {519types = (types << SLJIT_ARG_SHIFT) | (arg_types & SLJIT_ARG_MASK);520521switch (arg_types & SLJIT_ARG_MASK) {522case SLJIT_ARG_TYPE_F64:523case SLJIT_ARG_TYPE_F32:524arg_count++;525break;526default:527arg_count++;528word_arg_count++;529530if (arg_count != word_arg_count && arg_count == reg) {531FAIL_IF(push_inst(compiler, OR | S(reg) | A(TMP_CALL_REG) | B(reg)));532*src = TMP_CALL_REG;533}534break;535}536537arg_types >>= SLJIT_ARG_SHIFT;538}539540while (types) {541switch (types & SLJIT_ARG_MASK) {542case SLJIT_ARG_TYPE_F64:543case SLJIT_ARG_TYPE_F32:544arg_count--;545break;546default:547if (arg_count != word_arg_count)548FAIL_IF(push_inst(compiler, OR | S(word_arg_count) | A(arg_count) | B(word_arg_count)));549550arg_count--;551word_arg_count--;552break;553}554555types >>= SLJIT_ARG_SHIFT;556}557558return SLJIT_SUCCESS;559}560561static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw init_value)562{563FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(init_value >> 48)));564FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value >> 32)));565FAIL_IF(push_inst(compiler, SLDI(32) | S(reg) | A(reg)));566FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(init_value >> 16)));567return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value));568}569570static SLJIT_INLINE sljit_s32 sljit_emit_fop1_conv_f64_from_sw(struct sljit_compiler *compiler, sljit_s32 op,571sljit_s32 dst, sljit_sw dstw,572sljit_s32 src, sljit_sw srcw)573{574sljit_s32 dst_r = 
FAST_IS_REG(dst) ? dst : TMP_FREG1;575576if (src == SLJIT_IMM) {577if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_S32)578srcw = (sljit_s32)srcw;579580FAIL_IF(load_immediate(compiler, TMP_REG1, srcw));581src = TMP_REG1;582} else if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_S32) {583if (FAST_IS_REG(src))584FAIL_IF(push_inst(compiler, EXTSW | S(src) | A(TMP_REG1)));585else586FAIL_IF(emit_op_mem(compiler, INT_DATA | SIGNED_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));587src = TMP_REG1;588}589590if (FAST_IS_REG(src)) {591FAIL_IF(push_inst(compiler, STD | S(src) | A(SLJIT_SP) | TMP_MEM_OFFSET));592FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));593} else594FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA | LOAD_DATA, TMP_FREG1, src, srcw, TMP_REG1));595596FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));597598if (op & SLJIT_32)599FAIL_IF(push_inst(compiler, FRSP | FD(dst_r) | FB(dst_r)));600601if (dst & SLJIT_MEM)602return emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG1, dst, dstw, TMP_REG1);603return SLJIT_SUCCESS;604}605606static SLJIT_INLINE sljit_s32 sljit_emit_fop1_conv_f64_from_uw(struct sljit_compiler *compiler, sljit_s32 op,607sljit_s32 dst, sljit_sw dstw,608sljit_s32 src, sljit_sw srcw)609{610sljit_s32 dst_r = FAST_IS_REG(dst) ? 
dst : TMP_FREG1;611612if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_U32) {613if (src == SLJIT_IMM) {614FAIL_IF(load_immediate(compiler, TMP_REG1, (sljit_u32)srcw));615src = TMP_REG1;616} else {617if (FAST_IS_REG(src))618FAIL_IF(push_inst(compiler, CLRLDI(TMP_REG1, src, 32)));619else620FAIL_IF(emit_op_mem(compiler, INT_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));621src = TMP_REG1;622}623624FAIL_IF(push_inst(compiler, STD | S(src) | A(SLJIT_SP) | TMP_MEM_OFFSET));625FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));626FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));627} else {628if (src == SLJIT_IMM) {629FAIL_IF(load_immediate(compiler, TMP_REG1, srcw));630src = TMP_REG1;631} else if (src & SLJIT_MEM) {632FAIL_IF(emit_op_mem(compiler, WORD_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));633src = TMP_REG1;634}635636FAIL_IF(push_inst(compiler, CMPI | CRD(0 | 1) | A(src) | 0));637FAIL_IF(push_inst(compiler, BCx | (12 << 21) | (0 << 16) | 20));638FAIL_IF(push_inst(compiler, STD | S(src) | A(SLJIT_SP) | TMP_MEM_OFFSET));639FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));640FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));641FAIL_IF(push_inst(compiler, Bx | ((op & SLJIT_32) ? 36 : 32)));642643if (op & SLJIT_32)644FAIL_IF(push_inst(compiler, RLWINM | S(src) | A(TMP_REG2) | RLWI_SH(10) | RLWI_MBE(10, 21)));645else646FAIL_IF(push_inst(compiler, ANDI | S(src) | A(TMP_REG2) | 0x1));647648/* Shift right. 
*/649FAIL_IF(push_inst(compiler, RLDICL | S(src) | A(TMP_REG1) | RLDI_SH(63) | RLDI_MB(1)));650651if (op & SLJIT_32)652FAIL_IF(push_inst(compiler, RLDICR | S(TMP_REG1) | A(TMP_REG1) | RLDI_SH(0) | RLDI_ME(53)));653654FAIL_IF(push_inst(compiler, OR | S(TMP_REG1) | A(TMP_REG1) | B(TMP_REG2)));655656FAIL_IF(push_inst(compiler, STD | S(TMP_REG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));657FAIL_IF(push_inst(compiler, LFD | FS(TMP_FREG1) | A(SLJIT_SP) | TMP_MEM_OFFSET));658FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));659FAIL_IF(push_inst(compiler, FADD | FD(dst_r) | FA(dst_r) | FB(dst_r)));660}661662if (op & SLJIT_32)663FAIL_IF(push_inst(compiler, FRSP | FD(dst_r) | FB(dst_r)));664665if (dst & SLJIT_MEM)666return emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG1, dst, dstw, TMP_REG1);667return SLJIT_SUCCESS;668}669670SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fset64(struct sljit_compiler *compiler,671sljit_s32 freg, sljit_f64 value)672{673union {674sljit_sw imm;675sljit_f64 value;676} u;677678CHECK_ERROR();679CHECK(check_sljit_emit_fset64(compiler, freg, value));680681u.value = value;682683if (u.imm != 0)684FAIL_IF(load_immediate(compiler, TMP_REG1, u.imm));685686FAIL_IF(push_inst(compiler, STD | S(u.imm != 0 ? TMP_REG1 : TMP_ZERO) | A(SLJIT_SP) | TMP_MEM_OFFSET));687return push_inst(compiler, LFD | FS(freg) | A(SLJIT_SP) | TMP_MEM_OFFSET);688}689690SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fcopy(struct sljit_compiler *compiler, sljit_s32 op,691sljit_s32 freg, sljit_s32 reg)692{693CHECK_ERROR();694CHECK(check_sljit_emit_fcopy(compiler, op, freg, reg));695696if (GET_OPCODE(op) == SLJIT_COPY_TO_F64) {697FAIL_IF(push_inst(compiler, ((op & SLJIT_32) ? STW : STD) | S(reg) | A(SLJIT_SP) | TMP_MEM_OFFSET));698return push_inst(compiler, ((op & SLJIT_32) ? LFS : LFD) | FS(freg) | A(SLJIT_SP) | TMP_MEM_OFFSET);699}700701FAIL_IF(push_inst(compiler, ((op & SLJIT_32) ? 
STFS : STFD) | FS(freg) | A(SLJIT_SP) | TMP_MEM_OFFSET));702return push_inst(compiler, ((op & SLJIT_32) ? LWZ : LD) | S(reg) | A(SLJIT_SP) | TMP_MEM_OFFSET);703}704705SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)706{707sljit_ins *inst = (sljit_ins*)addr;708SLJIT_UNUSED_ARG(executable_offset);709710SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 0);711inst[0] = (inst[0] & 0xffff0000u) | ((sljit_ins)(new_target >> 48) & 0xffff);712inst[1] = (inst[1] & 0xffff0000u) | ((sljit_ins)(new_target >> 32) & 0xffff);713inst[3] = (inst[3] & 0xffff0000u) | ((sljit_ins)(new_target >> 16) & 0xffff);714inst[4] = (inst[4] & 0xffff0000u) | ((sljit_ins)new_target & 0xffff);715SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 1);716inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);717SLJIT_CACHE_FLUSH(inst, inst + 5);718}719720721