Path: blob/21.2-virgl/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_helper.cpp
4574 views
/*1* Copyright 2018 Red Hat Inc.2*3* Permission is hereby granted, free of charge, to any person obtaining a4* copy of this software and associated documentation files (the "Software"),5* to deal in the Software without restriction, including without limitation6* the rights to use, copy, modify, merge, publish, distribute, sublicense,7* and/or sell copies of the Software, and to permit persons to whom the8* Software is furnished to do so, subject to the following conditions:9*10* The above copyright notice and this permission notice shall be included in11* all copies or substantial portions of the Software.12*13* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR14* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,15* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL16* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR17* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,18* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR19* OTHER DEALINGS IN THE SOFTWARE.20*21* Authors: Karol Herbst <[email protected]>22*/2324#include "codegen/nv50_ir_lowering_helper.h"2526namespace nv50_ir {2728bool29LoweringHelper::visit(Instruction *insn)30{31switch (insn->op) {32case OP_ABS:33return handleABS(insn);34case OP_CVT:35return handleCVT(insn);36case OP_MAX:37case OP_MIN:38return handleMAXMIN(insn);39case OP_MOV:40return handleMOV(insn);41case OP_NEG:42return handleNEG(insn);43case OP_SAT:44return handleSAT(insn);45case OP_SLCT:46return handleSLCT(insn->asCmp());47case OP_AND:48case OP_NOT:49case OP_OR:50case OP_XOR:51return handleLogOp(insn);52default:53return true;54}55}5657bool58LoweringHelper::handleABS(Instruction *insn)59{60DataType dTy = insn->dType;61if (!(dTy == TYPE_U64 || dTy == TYPE_S64))62return true;6364bld.setPosition(insn, false);6566Value *neg = bld.getSSA(8);67Value *negComp[2], *srcComp[2];68Value *lo = bld.getSSA(), *hi = bld.getSSA();69bld.mkOp2(OP_SUB, dTy, neg, bld.mkImm((uint64_t)0), insn->getSrc(0));70bld.mkSplit(negComp, 4, neg);71bld.mkSplit(srcComp, 4, insn->getSrc(0));72bld.mkCmp(OP_SLCT, CC_LT, TYPE_S32, lo, TYPE_S32, negComp[0], srcComp[0], srcComp[1]);73bld.mkCmp(OP_SLCT, CC_LT, TYPE_S32, hi, TYPE_S32, negComp[1], srcComp[1], srcComp[1]);74insn->op = OP_MERGE;75insn->setSrc(0, lo);76insn->setSrc(1, hi);7778return true;79}8081bool82LoweringHelper::handleCVT(Instruction *insn)83{84DataType dTy = insn->dType;85DataType sTy = insn->sType;8687if (typeSizeof(dTy) <= 4 && typeSizeof(sTy) <= 4)88return true;8990bld.setPosition(insn, false);9192if ((dTy == TYPE_S32 && sTy == TYPE_S64) ||93(dTy == TYPE_U32 && sTy == TYPE_U64)) {94Value *src[2];95bld.mkSplit(src, 4, insn->getSrc(0));96insn->op = OP_MOV;97insn->setSrc(0, src[0]);98} else if (dTy == TYPE_S64 && sTy == TYPE_S32) {99Value *tmp = bld.getSSA();100bld.mkOp2(OP_SHR, TYPE_S32, tmp, insn->getSrc(0), bld.loadImm(bld.getSSA(), 31));101insn->op = OP_MERGE;102insn->setSrc(1, tmp);103} else if (dTy == TYPE_U64 && sTy == TYPE_U32) {104insn->op = OP_MERGE;105insn->setSrc(1, bld.loadImm(bld.getSSA(), 0));106}107108return true;109}110111bool112LoweringHelper::handleMAXMIN(Instruction *insn)113{114DataType dTy = insn->dType;115if (!(dTy == TYPE_U64 || dTy == TYPE_S64))116return true;117118DataType sTy = typeOfSize(4, false, isSignedIntType(dTy));119bld.setPosition(insn, false);120121Value *flag = bld.getSSA(1, FILE_FLAGS);122Value *src0[2];123Value *src1[2];124Value *def[2];125126bld.mkSplit(src0, 4, insn->getSrc(0));127bld.mkSplit(src1, 4, insn->getSrc(1));128129def[0] = bld.getSSA();130def[1] = bld.getSSA();131132Instruction *hi = bld.mkOp2(insn->op, sTy, def[1], src0[1], src1[1]);133hi->subOp = NV50_IR_SUBOP_MINMAX_HIGH;134hi->setFlagsDef(1, flag);135136Instruction *lo = bld.mkOp2(insn->op, sTy, def[0], src0[0], src1[0]);137lo->subOp = NV50_IR_SUBOP_MINMAX_LOW;138lo->setFlagsSrc(2, flag);139140insn->op = OP_MERGE;141insn->setSrc(0, def[0]);142insn->setSrc(1, def[1]);143144return true;145}146147bool148LoweringHelper::handleMOV(Instruction *insn)149{150DataType dTy = insn->dType;151152if (typeSizeof(dTy) != 8)153return true;154155Storage ® = insn->getSrc(0)->reg;156157if (reg.file != FILE_IMMEDIATE)158return true;159160bld.setPosition(insn, false);161162Value *hi = bld.getSSA();163Value *lo = bld.getSSA();164165bld.loadImm(lo, (uint32_t)(reg.data.u64 & 0xffffffff));166bld.loadImm(hi, (uint32_t)(reg.data.u64 >> 32));167168insn->op = OP_MERGE;169insn->setSrc(0, lo);170insn->setSrc(1, hi);171172return true;173}174175bool176LoweringHelper::handleNEG(Instruction *insn)177{178if (typeSizeof(insn->dType) != 8 || isFloatType(insn->dType))179return true;180181bld.setPosition(insn, false);182183insn->op = OP_SUB;184insn->setSrc(1, insn->getSrc(0));185insn->setSrc(0, bld.mkImm((uint64_t)0));186return true;187}188189bool190LoweringHelper::handleSAT(Instruction *insn)191{192DataType dTy = insn->dType;193194if (typeSizeof(dTy) != 8 || !isFloatType(dTy))195return true;196197bld.setPosition(insn, false);198199Value *tmp = bld.mkOp2v(OP_MAX, dTy, bld.getSSA(8), insn->getSrc(0), bld.loadImm(bld.getSSA(8), 0.0));200insn->op = OP_MIN;201insn->setSrc(0, tmp);202insn->setSrc(1, bld.loadImm(bld.getSSA(8), 1.0));203return true;204}205206bool207LoweringHelper::handleSLCT(CmpInstruction *insn)208{209DataType dTy = insn->dType;210DataType sTy = insn->sType;211212if (typeSizeof(dTy) != 8 || typeSizeof(sTy) == 8)213return true;214215CondCode cc = insn->getCondition();216DataType hdTy = typeOfSize(4, isFloatType(dTy), isSignedIntType(dTy));217bld.setPosition(insn, false);218219Value *src0[2];220Value *src1[2];221Value *def[2];222223bld.mkSplit(src0, 4, insn->getSrc(0));224bld.mkSplit(src1, 4, insn->getSrc(1));225226def[0] = bld.getSSA();227def[1] = bld.getSSA();228229bld.mkCmp(OP_SLCT, cc, hdTy, def[0], sTy, src0[0], src1[0], insn->getSrc(2));230bld.mkCmp(OP_SLCT, cc, hdTy, def[1], sTy, src0[1], src1[1], insn->getSrc(2));231232insn->op = OP_MERGE;233insn->setSrc(0, def[0]);234insn->setSrc(1, def[1]);235insn->setSrc(2, NULL);236237return true;238}239240bool241LoweringHelper::handleLogOp(Instruction *insn)242{243DataType dTy = insn->dType;244DataType sTy = typeOfSize(4, isFloatType(dTy), isSignedIntType(dTy));245246if (typeSizeof(dTy) != 8)247return true;248249bld.setPosition(insn, false);250251Value *src0[2];252Value *src1[2];253Value *def0 = bld.getSSA();254Value *def1 = bld.getSSA();255256bld.mkSplit(src0, 4, insn->getSrc(0));257if (insn->srcExists(1))258bld.mkSplit(src1, 4, insn->getSrc(1));259260Instruction *lo = bld.mkOp1(insn->op, sTy, def0, src0[0]);261Instruction *hi = bld.mkOp1(insn->op, sTy, def1, src0[1]);262if (insn->srcExists(1)) {263lo->setSrc(1, src1[0]);264hi->setSrc(1, src1[1]);265}266267insn->op = OP_MERGE;268insn->setSrc(0, def0);269insn->setSrc(1, def1);270271return true;272}273274} // namespace nv50_ir275276277