Path: blob/21.2-virgl/src/panfrost/midgard/midgard_ops.c
4564 views
/* Copyright (c) 2018-2019 Alyssa Rosenzweig ([email protected])1* Copyright (C) 2019-2020 Collabora, Ltd.2*3* Permission is hereby granted, free of charge, to any person obtaining a copy4* of this software and associated documentation files (the "Software"), to deal5* in the Software without restriction, including without limitation the rights6* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell7* copies of the Software, and to permit persons to whom the Software is8* furnished to do so, subject to the following conditions:9*10* The above copyright notice and this permission notice shall be included in11* all copies or substantial portions of the Software.12*13* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR14* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,15* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE16* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER17* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,18* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN19* THE SOFTWARE.20*/2122#include "midgard.h"2324/* Include the definitions of the macros and such */2526#define MIDGARD_OPS_TABLE27#include "helpers.h"28#undef MIDGARD_OPS_TABLE2930/* Table of mapping opcodes to accompanying properties. This is used for both31* the disassembler and the compiler. It is placed in a .c file like this to32* avoid duplications in the binary */3334struct mir_op_props alu_opcode_props[256] = {35[midgard_alu_op_fadd] = {"FADD", UNITS_ADD | OP_COMMUTES},36[midgard_alu_op_fadd_rtz] = {"FADD.rtz", UNITS_ADD | OP_COMMUTES},37[midgard_alu_op_fadd_rtn] = {"FADD.rtn", UNITS_ADD | OP_COMMUTES},38[midgard_alu_op_fadd_rtp] = {"FADD.rtp", UNITS_ADD | OP_COMMUTES},39[midgard_alu_op_fmul] = {"FMUL", UNITS_MUL | UNIT_VLUT | OP_COMMUTES},40[midgard_alu_op_fmul_rtz] = {"FMUL.rtz", UNITS_MUL | UNIT_VLUT | OP_COMMUTES},41[midgard_alu_op_fmul_rtn] = {"FMUL.rtn", UNITS_MUL | UNIT_VLUT | OP_COMMUTES},42[midgard_alu_op_fmul_rtp] = {"FMUL.rtp", UNITS_MUL | UNIT_VLUT | OP_COMMUTES},43[midgard_alu_op_fmin] = {"FMIN", UNITS_MOST | OP_COMMUTES},44[midgard_alu_op_fmin_nan] = {"FMIN.nan", UNITS_MOST | OP_COMMUTES},45[midgard_alu_op_fabsmin] = {"FABSMIN", UNITS_MOST | OP_COMMUTES},46[midgard_alu_op_fabsmin_nan] = {"FABSMIN.nan", UNITS_MOST | OP_COMMUTES},47[midgard_alu_op_fmax] = {"FMAX", UNITS_MOST | OP_COMMUTES},48[midgard_alu_op_fmax_nan] = {"FMAX.nan", UNITS_MOST | OP_COMMUTES},49[midgard_alu_op_fabsmax] = {"FABSMAX", UNITS_MOST | OP_COMMUTES},50[midgard_alu_op_fabsmax_nan] = {"FABSMAX.nan", UNITS_MOST | OP_COMMUTES},51[midgard_alu_op_imin] = {"MIN", UNITS_MOST | OP_COMMUTES},52[midgard_alu_op_imax] = {"MAX", UNITS_MOST | OP_COMMUTES},53[midgard_alu_op_umin] = {"MIN", UNITS_MOST | OP_COMMUTES},54[midgard_alu_op_umax] = {"MAX", UNITS_MOST | OP_COMMUTES},55[midgard_alu_op_iavg] = {"AVG.rtz", UNITS_ADD | OP_COMMUTES},56[midgard_alu_op_uavg] = {"AVG.rtz", UNITS_ADD | OP_COMMUTES},57[midgard_alu_op_iravg] = {"AVG.round", UNITS_ADD | OP_COMMUTES},58[midgard_alu_op_uravg] = {"AVG.round", UNITS_ADD | OP_COMMUTES},5960[midgard_alu_op_fmov] = {"FMOV", UNITS_ALL | QUIRK_FLIPPED_R24},61[midgard_alu_op_fmov_rtz] = {"FMOV.rtz", UNITS_ALL | QUIRK_FLIPPED_R24},62[midgard_alu_op_fmov_rtn] = {"FMOV.rtn", UNITS_ALL | QUIRK_FLIPPED_R24},63[midgard_alu_op_fmov_rtp] = {"FMOV.rtp", UNITS_ALL | QUIRK_FLIPPED_R24},64[midgard_alu_op_froundaway] = {"FROUNDAWAY", UNITS_ADD},65[midgard_alu_op_froundeven] = {"FROUNDEVEN", UNITS_ADD},66[midgard_alu_op_ftrunc] = {"FTRUNC", UNITS_ADD},67[midgard_alu_op_ffloor] = {"FFLOOR", UNITS_ADD},68[midgard_alu_op_fceil] = {"FCEIL", UNITS_ADD},6970/* Multiplies the X/Y components of the first arg and adds the second71* arg. Like other LUTs, it must be scalarized. */72[midgard_alu_op_ffma] = {"FMA", UNIT_VLUT},73[midgard_alu_op_ffma_rtz] = {"FMA.rtz", UNIT_VLUT},74[midgard_alu_op_ffma_rtn] = {"FMA.rtn", UNIT_VLUT},75[midgard_alu_op_ffma_rtp] = {"FMA.rtp", UNIT_VLUT},7677/* Though they output a scalar, they need to run on a vector unit78* since they process vectors */79[midgard_alu_op_fdot3] = {"FDOT3", UNIT_VMUL | OP_CHANNEL_COUNT(3) | OP_COMMUTES},80[midgard_alu_op_fdot3r] = {"FDOT3R", UNIT_VMUL | OP_CHANNEL_COUNT(3) | OP_COMMUTES},81[midgard_alu_op_fdot4] = {"FDOT4", UNIT_VMUL | OP_CHANNEL_COUNT(4) | OP_COMMUTES},8283/* Incredibly, iadd can run on vmul, etc */84[midgard_alu_op_iadd] = {"ADD", UNITS_MOST | OP_COMMUTES},85[midgard_alu_op_ishladd] = {"ADD", UNITS_MUL},86[midgard_alu_op_iaddsat] = {"ADDSAT", UNITS_ADD | OP_COMMUTES},87[midgard_alu_op_uaddsat] = {"ADDSAT", UNITS_ADD | OP_COMMUTES},88[midgard_alu_op_uabsdiff] = {"ABSDIFF", UNITS_ADD},89[midgard_alu_op_iabsdiff] = {"ABSDIFF", UNITS_ADD},90[midgard_alu_op_ichoose] = {"CHOOSE", UNITS_ADD},91[midgard_alu_op_isub] = {"SUB", UNITS_MOST},92[midgard_alu_op_ishlsub] = {"SUB", UNITS_MUL},93[midgard_alu_op_isubsat] = {"SUBSAT", UNITS_ADD},94[midgard_alu_op_usubsat] = {"SUBSAT", UNITS_ADD},95[midgard_alu_op_imul] = {"MUL", UNITS_MUL | OP_COMMUTES},96[midgard_alu_op_iwmul] = {"WMUL.s", UNIT_VMUL | OP_COMMUTES},97[midgard_alu_op_uwmul] = {"WMUL.u", UNIT_VMUL | OP_COMMUTES},98[midgard_alu_op_iuwmul] = {"WMUL.su", UNIT_VMUL | OP_COMMUTES},99[midgard_alu_op_imov] = {"MOV", UNITS_ALL | QUIRK_FLIPPED_R24},100101/* For vector comparisons, use ball etc */102[midgard_alu_op_feq] = {"FCMP.eq", UNITS_MOST | OP_TYPE_CONVERT | OP_COMMUTES},103[midgard_alu_op_fne] = {"FCMP.ne", UNITS_MOST | OP_TYPE_CONVERT | OP_COMMUTES},104[midgard_alu_op_fle] = {"FCMP.le", UNITS_MOST | OP_TYPE_CONVERT},105[midgard_alu_op_flt] = {"FCMP.lt", UNITS_MOST | OP_TYPE_CONVERT},106[midgard_alu_op_ieq] = {"CMP.eq", UNITS_MOST | OP_COMMUTES},107[midgard_alu_op_ine] = {"CMP.ne", UNITS_MOST | OP_COMMUTES},108[midgard_alu_op_ilt] = {"CMP.lt", UNITS_MOST},109[midgard_alu_op_ile] = {"CMP.le", UNITS_MOST},110[midgard_alu_op_ult] = {"CMP.lt", UNITS_MOST},111[midgard_alu_op_ule] = {"CMP.le", UNITS_MOST},112113/* csel must run in the second pipeline stage (condition written in first) */114[midgard_alu_op_icsel] = {"CSEL.scalar", UNIT_VADD | UNIT_SMUL},115[midgard_alu_op_icsel_v] = {"CSEL.vector", UNIT_VADD | UNIT_SMUL}, /* Acts as bitselect() */116[midgard_alu_op_fcsel_v] = {"FCSEL.vector", UNIT_VADD | UNIT_SMUL},117[midgard_alu_op_fcsel] = {"FCSEL.scalar", UNIT_VADD | UNIT_SMUL},118119[midgard_alu_op_frcp] = {"FRCP", UNIT_VLUT},120[midgard_alu_op_frsqrt] = {"FRSQRT", UNIT_VLUT},121[midgard_alu_op_fsqrt] = {"FSQRT", UNIT_VLUT},122[midgard_alu_op_fpow_pt1] = {"FPOW_PT1", UNIT_VLUT},123[midgard_alu_op_fpown_pt1] = {"FPOWN_PT1", UNIT_VLUT},124[midgard_alu_op_fpowr_pt1] = {"FPOWR_PT1", UNIT_VLUT},125[midgard_alu_op_fexp2] = {"FEXP2", UNIT_VLUT},126[midgard_alu_op_flog2] = {"FLOG2", UNIT_VLUT},127128[midgard_alu_op_f2i_rte] = {"F2I", UNITS_ADD | OP_TYPE_CONVERT | MIDGARD_ROUNDS},129[midgard_alu_op_f2i_rtz] = {"F2I.rtz", UNITS_ADD | OP_TYPE_CONVERT},130[midgard_alu_op_f2i_rtn] = {"F2I.rtn", UNITS_ADD | OP_TYPE_CONVERT},131[midgard_alu_op_f2i_rtp] = {"F2I.rtp", UNITS_ADD | OP_TYPE_CONVERT},132[midgard_alu_op_f2u_rte] = {"F2U", UNITS_ADD | OP_TYPE_CONVERT | MIDGARD_ROUNDS},133[midgard_alu_op_f2u_rtz] = {"F2U.rtz", UNITS_ADD | OP_TYPE_CONVERT},134[midgard_alu_op_f2u_rtn] = {"F2U.rtn", UNITS_ADD | OP_TYPE_CONVERT},135[midgard_alu_op_f2u_rtp] = {"F2U.rtp", UNITS_ADD | OP_TYPE_CONVERT},136[midgard_alu_op_i2f_rte] = {"I2F", UNITS_ADD | OP_TYPE_CONVERT},137[midgard_alu_op_i2f_rtz] = {"I2F.rtz", UNITS_ADD | OP_TYPE_CONVERT},138[midgard_alu_op_i2f_rtn] = {"I2F.rtn", UNITS_ADD | OP_TYPE_CONVERT},139[midgard_alu_op_i2f_rtp] = {"I2F.rtp", UNITS_ADD | OP_TYPE_CONVERT},140[midgard_alu_op_u2f_rte] = {"U2F", UNITS_ADD | OP_TYPE_CONVERT},141[midgard_alu_op_u2f_rtz] = {"U2F.rtz", UNITS_ADD | OP_TYPE_CONVERT},142[midgard_alu_op_u2f_rtn] = {"U2F.rtn", UNITS_ADD | OP_TYPE_CONVERT},143[midgard_alu_op_u2f_rtp] = {"U2F.rtp", UNITS_ADD | OP_TYPE_CONVERT},144145[midgard_alu_op_fsinpi] = {"FSINPI", UNIT_VLUT},146[midgard_alu_op_fcospi] = {"FCOSPI", UNIT_VLUT},147148[midgard_alu_op_iand] = {"AND", UNITS_MOST | OP_COMMUTES},149[midgard_alu_op_iandnot] = {"ANDNOT", UNITS_MOST},150151[midgard_alu_op_ior] = {"OR", UNITS_MOST | OP_COMMUTES},152[midgard_alu_op_iornot] = {"ORNOT", UNITS_MOST | OP_COMMUTES},153[midgard_alu_op_inor] = {"NOR", UNITS_MOST | OP_COMMUTES},154[midgard_alu_op_ixor] = {"XOR", UNITS_MOST | OP_COMMUTES},155[midgard_alu_op_inxor] = {"NXOR", UNITS_MOST | OP_COMMUTES},156[midgard_alu_op_iclz] = {"CLZ", UNITS_ADD},157[midgard_alu_op_ipopcnt] = {"POPCNT", UNIT_VADD},158[midgard_alu_op_inand] = {"NAND", UNITS_MOST},159[midgard_alu_op_ishl] = {"SHL", UNITS_ADD},160[midgard_alu_op_ishlsat] = {"SHL.sat", UNITS_ADD},161[midgard_alu_op_ushlsat] = {"SHL.sat", UNITS_ADD},162[midgard_alu_op_iasr] = {"ASR", UNITS_ADD},163[midgard_alu_op_ilsr] = {"LSR", UNITS_ADD},164165[midgard_alu_op_fball_eq] = {"FCMP.all.eq", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},166[midgard_alu_op_fball_neq] = {"FCMP.all.ne", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},167[midgard_alu_op_fball_lt] = {"FCMP.all.lt", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},168[midgard_alu_op_fball_lte] = {"FCMP.all.le", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},169170[midgard_alu_op_fbany_eq] = {"FCMP.any.eq", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},171[midgard_alu_op_fbany_neq] = {"FCMP.any.ne", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},172[midgard_alu_op_fbany_lt] = {"FCMP.any.lt", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},173[midgard_alu_op_fbany_lte] = {"FCMP.any.le", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES | OP_TYPE_CONVERT},174175[midgard_alu_op_iball_eq] = {"CMP.all.eq", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},176[midgard_alu_op_iball_neq] = {"CMP.all.ne", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},177[midgard_alu_op_iball_lt] = {"CMP.all.lt", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},178[midgard_alu_op_iball_lte] = {"CMP.all.le", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},179[midgard_alu_op_uball_lt] = {"CMP.all.lt", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},180[midgard_alu_op_uball_lte] = {"CMP.all.le", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},181182[midgard_alu_op_ibany_eq] = {"CMP.any.eq", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},183[midgard_alu_op_ibany_neq] = {"CMP.any.ne", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},184[midgard_alu_op_ibany_lt] = {"CMP.any.lt", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},185[midgard_alu_op_ibany_lte] = {"CMP.any.le", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},186[midgard_alu_op_ubany_lt] = {"CMP.any.lt", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},187[midgard_alu_op_ubany_lte] = {"CMP.any.le", UNITS_VECTOR | OP_CHANNEL_COUNT(4) | OP_COMMUTES},188189[midgard_alu_op_fatan2_pt1] = {"FATAN2_PT1", UNIT_VLUT},190[midgard_alu_op_fatan2_pt2] = {"FATAN2_PT2", UNIT_VLUT},191192/* Haven't seen in a while */193[midgard_alu_op_freduce] = {"FREDUCE", 0},194};195196/* Define shorthands */197198#define M8 midgard_reg_mode_8199#define M16 midgard_reg_mode_16200#define M32 midgard_reg_mode_32201#define M64 midgard_reg_mode_64202203struct mir_ldst_op_props load_store_opcode_props[256] = {204[midgard_op_unpack_colour_f32] = {"UNPACK.f32", M32},205[midgard_op_unpack_colour_f16] = {"UNPACK.f16", M32},206[midgard_op_unpack_colour_u32] = {"UNPACK.u32", M32},207[midgard_op_unpack_colour_s32] = {"UNPACK.s32", M32},208[midgard_op_pack_colour_f32] = {"PACK.f32", M32},209[midgard_op_pack_colour_f16] = {"PACK.f16", M32},210[midgard_op_pack_colour_u32] = {"PACK.u32", M32},211[midgard_op_pack_colour_s32] = {"PACK.s32", M32},212[midgard_op_lea] = {"LEA", M32 | LDST_ADDRESS },213[midgard_op_lea_image] = {"LEA_IMAGE", M32 | LDST_ATTRIB },214[midgard_op_ld_cubemap_coords] = {"CUBEMAP", M32},215[midgard_op_ldst_mov] = {"LDST_MOV", M32},216[midgard_op_ldst_perspective_div_y] = {"LDST_PERSPECTIVE_DIV_Y", M32},217[midgard_op_ldst_perspective_div_z] = {"LDST_PERSPECTIVE_DIV_Z", M32},218[midgard_op_ldst_perspective_div_w] = {"LDST_PERSPECTIVE_DIV_W", M32},219220[midgard_op_atomic_add] = {"AADD.32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},221[midgard_op_atomic_and] = {"AAND.32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},222[midgard_op_atomic_or] = {"AOR.32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},223[midgard_op_atomic_xor] = {"AXOR.32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},224[midgard_op_atomic_imin] = {"AMIN.s32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},225[midgard_op_atomic_umin] = {"AMIN.u32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},226[midgard_op_atomic_imax] = {"AMAX.s32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},227[midgard_op_atomic_umax] = {"AMAX.u32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},228[midgard_op_atomic_xchg] = {"XCHG.32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},229[midgard_op_atomic_cmpxchg] = {"CMPXCHG.32", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},230231[midgard_op_atomic_add64] = {"AADD.64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},232[midgard_op_atomic_and64] = {"AAND.64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},233[midgard_op_atomic_or64] = {"AOR.64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},234[midgard_op_atomic_xor64] = {"AXOR.64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},235[midgard_op_atomic_imin64] = {"AMIN.s64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},236[midgard_op_atomic_umin64] = {"AMIN.u64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},237[midgard_op_atomic_imax64] = {"AMAX.s64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},238[midgard_op_atomic_umax64] = {"AMAX.u64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},239[midgard_op_atomic_xchg64] = {"XCHG.64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},240[midgard_op_atomic_cmpxchg64] = {"CMPXCHG.64", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},241242[midgard_op_atomic_add_be] = {"AADD.32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},243[midgard_op_atomic_and_be] = {"AAND.32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},244[midgard_op_atomic_or_be] = {"AOR.32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},245[midgard_op_atomic_xor_be] = {"AXOR.32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},246[midgard_op_atomic_imin_be] = {"AMIN.s32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},247[midgard_op_atomic_umin_be] = {"AMIN.u32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},248[midgard_op_atomic_imax_be] = {"AMAX.s32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},249[midgard_op_atomic_umax_be] = {"AMAX.u32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},250[midgard_op_atomic_xchg_be] = {"XCHG.32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},251[midgard_op_atomic_cmpxchg_be] = {"CMPXCHG.32.be", M32 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},252253[midgard_op_atomic_add64] = {"AADD.64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},254[midgard_op_atomic_and64] = {"AAND.64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},255[midgard_op_atomic_or64] = {"AOR.64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},256[midgard_op_atomic_xor64] = {"AXOR.64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},257[midgard_op_atomic_imin64] = {"AMIN.s64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},258[midgard_op_atomic_umin64] = {"AMIN.u64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},259[midgard_op_atomic_imax64] = {"AMAX.s64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},260[midgard_op_atomic_umax64] = {"AMAX.u64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},261[midgard_op_atomic_xchg64] = {"XCHG.64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},262[midgard_op_atomic_cmpxchg64] = {"CMPXCHG.64.be", M64 | LDST_SIDE_FX | LDST_ADDRESS | LDST_ATOMIC},263264[midgard_op_ld_u8] = {"LD.u8", M32 | LDST_ADDRESS},265[midgard_op_ld_i8] = {"LD.s8", M32 | LDST_ADDRESS},266[midgard_op_ld_u16] = {"LD.u16", M32 | LDST_ADDRESS},267[midgard_op_ld_i16] = {"LD.s16", M32 | LDST_ADDRESS},268[midgard_op_ld_u16_be] = {"LD.u16.be", M32 | LDST_ADDRESS},269[midgard_op_ld_i16_be] = {"LD.s16.be", M32 | LDST_ADDRESS},270[midgard_op_ld_32] = {"LD.32", M32 | LDST_ADDRESS},271[midgard_op_ld_32_bswap2] = {"LD.32.bswap2", M32 | LDST_ADDRESS},272[midgard_op_ld_32_bswap4] = {"LD.32.bswap4", M32 | LDST_ADDRESS},273[midgard_op_ld_64] = {"LD.64", M32 | LDST_ADDRESS},274[midgard_op_ld_64_bswap2] = {"LD.64.bswap2", M32 | LDST_ADDRESS},275[midgard_op_ld_64_bswap4] = {"LD.64.bswap4", M32 | LDST_ADDRESS},276[midgard_op_ld_64_bswap8] = {"LD.64.bswap8", M32 | LDST_ADDRESS},277[midgard_op_ld_128] = {"LD.128", M32 | LDST_ADDRESS},278[midgard_op_ld_128_bswap2] = {"LD.128.bswap2", M32 | LDST_ADDRESS},279[midgard_op_ld_128_bswap4] = {"LD.128.bswap4", M32 | LDST_ADDRESS},280[midgard_op_ld_128_bswap8] = {"LD.128.bswap8", M32 | LDST_ADDRESS},281282[midgard_op_ld_attr_32] = {"LD_ATTR.f32", M32 | LDST_ATTRIB},283[midgard_op_ld_attr_32i] = {"LD_ATTR.s32", M32 | LDST_ATTRIB},284[midgard_op_ld_attr_32u] = {"LD_ATTR.u32", M32 | LDST_ATTRIB},285[midgard_op_ld_attr_16] = {"LD_ATTR.f16", M32 | LDST_ATTRIB},286287[midgard_op_ld_vary_32] = {"LD_VARY.f32", M32 | LDST_ATTRIB},288[midgard_op_ld_vary_16] = {"LD_VARY.f16", M32 | LDST_ATTRIB},289[midgard_op_ld_vary_32i] = {"LD_VARY.s32", M32 | LDST_ATTRIB},290[midgard_op_ld_vary_32u] = {"LD_VARY.u32", M32 | LDST_ATTRIB},291292[midgard_op_ld_special_32f] = {"LD_SPECIAL.f32", M32 | LDST_SPECIAL_MASK},293[midgard_op_ld_special_16f] = {"LD_SPECIAL.f16", M16 | LDST_SPECIAL_MASK},294[midgard_op_ld_special_32u] = {"LD_SPECIAL.u32", M32},295[midgard_op_ld_special_32i] = {"LD_SPECIAL.s32", M32},296297[midgard_op_ld_tilebuffer_32f] = {"LD_TILEBUFFER.f32", M32},298[midgard_op_ld_tilebuffer_16f] = {"LD_TILEBUFFER.f16", M16},299[midgard_op_ld_tilebuffer_raw] = {"LD_TILEBUFFER.raw", M32},300301[midgard_op_ld_ubo_u8] = {"LD_UBO.u8", M32},302[midgard_op_ld_ubo_i8] = {"LD_UBO.s8", M32},303[midgard_op_ld_ubo_u16] = {"LD_UBO.u16", M16},304[midgard_op_ld_ubo_i16] = {"LD_UBO.s16", M16},305[midgard_op_ld_ubo_u16_be] = {"LD_UBO.u16.be", M16},306[midgard_op_ld_ubo_i16_be] = {"LD_UBO.s16.be", M16},307[midgard_op_ld_ubo_32] = {"LD_UBO.32", M32},308[midgard_op_ld_ubo_32_bswap2] = {"LD_UBO.32.bswap2", M32},309[midgard_op_ld_ubo_32_bswap4] = {"LD_UBO.32.bswap4", M32},310[midgard_op_ld_ubo_64] = {"LD_UBO.64", M32},311[midgard_op_ld_ubo_64_bswap2] = {"LD_UBO.64.bswap2", M32},312[midgard_op_ld_ubo_64_bswap4] = {"LD_UBO.64.bswap4", M32},313[midgard_op_ld_ubo_64_bswap8] = {"LD_UBO.64.bswap8", M32},314[midgard_op_ld_ubo_128] = {"LD_UBO.128", M32},315[midgard_op_ld_ubo_128_bswap2] = {"LD_UBO.128.bswap2", M32},316[midgard_op_ld_ubo_128_bswap4] = {"LD_UBO.128.bswap4", M32},317[midgard_op_ld_ubo_128_bswap8] = {"LD_UBO.128.bswap8", M32},318319[midgard_op_ld_image_32f] = {"LD_IMAGE.f32", M32 | LDST_ATTRIB},320[midgard_op_ld_image_16f] = {"LD_IMAGE.f16", M16 | LDST_ATTRIB},321[midgard_op_ld_image_32i] = {"LD_IMAGE.s32", M32 | LDST_ATTRIB},322[midgard_op_ld_image_32u] = {"LD_IMAGE.u32", M32 | LDST_ATTRIB},323324[midgard_op_st_u8] = {"ST.u8", M32 | LDST_STORE | LDST_ADDRESS},325[midgard_op_st_i8] = {"ST.s8", M32 | LDST_STORE | LDST_ADDRESS},326[midgard_op_st_u16] = {"ST.u16", M32 | LDST_STORE | LDST_ADDRESS},327[midgard_op_st_i16] = {"ST.s16", M32 | LDST_STORE | LDST_ADDRESS},328[midgard_op_st_u16_be] = {"ST.u16.be", M32 | LDST_STORE | LDST_ADDRESS},329[midgard_op_st_i16_be] = {"ST.s16.be", M32 | LDST_STORE | LDST_ADDRESS},330[midgard_op_st_32] = {"ST.32", M32 | LDST_STORE | LDST_ADDRESS},331[midgard_op_st_32_bswap2] = {"ST.32.bswap2", M32 | LDST_STORE | LDST_ADDRESS},332[midgard_op_st_32_bswap4] = {"ST.32.bswap4", M32 | LDST_STORE | LDST_ADDRESS},333[midgard_op_st_64] = {"ST.64", M32 | LDST_STORE | LDST_ADDRESS},334[midgard_op_st_64_bswap2] = {"ST.64.bswap2", M32 | LDST_STORE | LDST_ADDRESS},335[midgard_op_st_64_bswap4] = {"ST.64.bswap4", M32 | LDST_STORE | LDST_ADDRESS},336[midgard_op_st_64_bswap8] = {"ST.64.bswap8", M32 | LDST_STORE | LDST_ADDRESS},337[midgard_op_st_128] = {"ST.128", M32 | LDST_STORE | LDST_ADDRESS},338[midgard_op_st_128_bswap2] = {"ST.128.bswap2", M32 | LDST_STORE | LDST_ADDRESS},339[midgard_op_st_128_bswap4] = {"ST.128.bswap4", M32 | LDST_STORE | LDST_ADDRESS},340[midgard_op_st_128_bswap8] = {"ST.128.bswap8", M32 | LDST_STORE | LDST_ADDRESS},341342[midgard_op_st_vary_32] = {"ST_VARY.f32", M32 | LDST_STORE | LDST_ATTRIB},343[midgard_op_st_vary_32i] = {"ST_VARY.s32", M32 | LDST_STORE | LDST_ATTRIB},344[midgard_op_st_vary_32u] = {"ST_VARY.u32", M32 | LDST_STORE | LDST_ATTRIB},345[midgard_op_st_vary_16] = {"ST_VARY.f16", M16 | LDST_STORE | LDST_ATTRIB},346347[midgard_op_st_image_32f] = {"ST_IMAGE.f32", M32 | LDST_STORE | LDST_ATTRIB},348[midgard_op_st_image_16f] = {"ST_IMAGE.f16", M16 | LDST_STORE | LDST_ATTRIB},349[midgard_op_st_image_32i] = {"ST_IMAGE.u32", M32 | LDST_STORE | LDST_ATTRIB},350[midgard_op_st_image_32u] = {"ST_IMAGE.s32", M32 | LDST_STORE | LDST_ATTRIB},351352[midgard_op_st_special_32f] = {"ST_SPECIAL.f32", M32},353[midgard_op_st_special_16f] = {"ST_SPECIAL.f16", M16},354[midgard_op_st_special_32u] = {"ST_SPECIAL.u32", M32},355[midgard_op_st_special_32i] = {"ST_SPECIAL.s32", M32},356357[midgard_op_st_tilebuffer_32f] = {"ST_TILEBUFFER.f32", M32},358[midgard_op_st_tilebuffer_16f] = {"ST_TILEBUFFER.f16", M16},359[midgard_op_st_tilebuffer_raw] = {"ST_TILEBUFFER.raw", M32},360};361362struct mir_tex_op_props tex_opcode_props[256] = {363[midgard_tex_op_normal] = {"TEX", M32},364[midgard_tex_op_gradient] = {"TEX_GRAD", M32},365[midgard_tex_op_fetch] = {"TEX_FETCH", M32},366[midgard_tex_op_grad_from_derivative] = {"DER_TO_GRAD", M32},367[midgard_tex_op_grad_from_coords] = {"COORDS_TO_GRAD", M32},368[midgard_tex_op_mov] = {"MOV", M32},369[midgard_tex_op_barrier] = {"BARRIER", M32},370[midgard_tex_op_derivative] = {"DERIVATIVE", M32}371};372373#undef M8374#undef M16375#undef M32376#undef M64377378struct mir_tag_props midgard_tag_props[16] = {379[TAG_INVALID] = {"invalid", 0},380[TAG_BREAK] = {"break", 0},381[TAG_TEXTURE_4_VTX] = {"tex/vt", 1},382[TAG_TEXTURE_4] = {"tex", 1},383[TAG_TEXTURE_4_BARRIER] = {"tex/bar", 1},384[TAG_LOAD_STORE_4] = {"ldst", 1},385[TAG_UNKNOWN_1] = {"unk1", 1},386[TAG_UNKNOWN_2] = {"unk2", 1},387[TAG_ALU_4] = {"alu/4", 1},388[TAG_ALU_8] = {"alu/8", 2},389[TAG_ALU_12] = {"alu/12", 3},390[TAG_ALU_16] = {"alu/16", 4},391[TAG_ALU_4_WRITEOUT] = {"aluw/4", 1},392[TAG_ALU_8_WRITEOUT] = {"aluw/8", 2},393[TAG_ALU_12_WRITEOUT] = {"aluw/12", 3},394[TAG_ALU_16_WRITEOUT] = {"aluw/16", 4}395};396397398