/* Path: blob/21.2-virgl/src/freedreno/vulkan/tu_formats.c
 * (scraped listing; 4565 views)
 */
1/*2* Copyright © 2016 Red Hat.3* Copyright © 2016 Bas Nieuwenhuizen4*5* Permission is hereby granted, free of charge, to any person obtaining a6* copy of this software and associated documentation files (the "Software"),7* to deal in the Software without restriction, including without limitation8* the rights to use, copy, modify, merge, publish, distribute, sublicense,9* and/or sell copies of the Software, and to permit persons to whom the10* Software is furnished to do so, subject to the following conditions:11*12* The above copyright notice and this permission notice (including the next13* paragraph) shall be included in all copies or substantial portions of the14* Software.15*16* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR17* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,18* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL19* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER20* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING21* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER22* DEALINGS IN THE SOFTWARE.23*/2425#include "tu_private.h"2627#include "adreno_common.xml.h"28#include "a6xx.xml.h"2930#include "vk_format.h"31#include "vk_util.h"32#include "drm-uapi/drm_fourcc.h"3334#define TU6_FMT(vkfmt, hwfmt, swapfmt, valid) \35[VK_FORMAT_##vkfmt] = { \36.fmt = FMT6_##hwfmt, \37.swap = swapfmt, \38.supported = valid, \39}4041#define TU6_VTC(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_VERTEX | FMT_TEXTURE | FMT_COLOR)42#define TU6_xTC(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_TEXTURE | FMT_COLOR)43#define TU6_Vxx(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_VERTEX)44#define TU6_xTx(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_TEXTURE)45#define TU6_xxx(vk, fmt, swap) TU6_FMT(vk, NONE, WZYX, 0)4647static const struct tu_native_format tu6_format_table[] = {48TU6_xxx(UNDEFINED, x, x), /* 0 */4950/* 8-bit packed 
*/51TU6_xxx(R4G4_UNORM_PACK8, 4_4_UNORM, WZXY), /* 1 */5253/* 16-bit packed */54TU6_xTC(R4G4B4A4_UNORM_PACK16, 4_4_4_4_UNORM, XYZW), /* 2 */55TU6_xTC(B4G4R4A4_UNORM_PACK16, 4_4_4_4_UNORM, ZYXW), /* 3 */56TU6_xTC(R5G6B5_UNORM_PACK16, 5_6_5_UNORM, WXYZ), /* 4 */57TU6_xTC(B5G6R5_UNORM_PACK16, 5_6_5_UNORM, WZYX), /* 5 */58TU6_xTC(R5G5B5A1_UNORM_PACK16, 5_5_5_1_UNORM, XYZW), /* 6 */59TU6_xTC(B5G5R5A1_UNORM_PACK16, 5_5_5_1_UNORM, ZYXW), /* 7 */60TU6_xTC(A1R5G5B5_UNORM_PACK16, 5_5_5_1_UNORM, WXYZ), /* 8 */6162/* 8-bit R */63TU6_VTC(R8_UNORM, 8_UNORM, WZYX), /* 9 */64TU6_VTC(R8_SNORM, 8_SNORM, WZYX), /* 10 */65TU6_Vxx(R8_USCALED, 8_UINT, WZYX), /* 11 */66TU6_Vxx(R8_SSCALED, 8_SINT, WZYX), /* 12 */67TU6_VTC(R8_UINT, 8_UINT, WZYX), /* 13 */68TU6_VTC(R8_SINT, 8_SINT, WZYX), /* 14 */69TU6_xTC(R8_SRGB, 8_UNORM, WZYX), /* 15 */7071/* 16-bit RG */72TU6_VTC(R8G8_UNORM, 8_8_UNORM, WZYX), /* 16 */73TU6_VTC(R8G8_SNORM, 8_8_SNORM, WZYX), /* 17 */74TU6_Vxx(R8G8_USCALED, 8_8_UINT, WZYX), /* 18 */75TU6_Vxx(R8G8_SSCALED, 8_8_SINT, WZYX), /* 19 */76TU6_VTC(R8G8_UINT, 8_8_UINT, WZYX), /* 20 */77TU6_VTC(R8G8_SINT, 8_8_SINT, WZYX), /* 21 */78TU6_xTC(R8G8_SRGB, 8_8_UNORM, WZYX), /* 22 */7980/* 24-bit RGB */81TU6_Vxx(R8G8B8_UNORM, 8_8_8_UNORM, WZYX), /* 23 */82TU6_Vxx(R8G8B8_SNORM, 8_8_8_SNORM, WZYX), /* 24 */83TU6_Vxx(R8G8B8_USCALED, 8_8_8_UINT, WZYX), /* 25 */84TU6_Vxx(R8G8B8_SSCALED, 8_8_8_SINT, WZYX), /* 26 */85TU6_Vxx(R8G8B8_UINT, 8_8_8_UINT, WZYX), /* 27 */86TU6_Vxx(R8G8B8_SINT, 8_8_8_SINT, WZYX), /* 28 */87TU6_xxx(R8G8B8_SRGB, 8_8_8_UNORM, WZYX), /* 29 */8889/* 24-bit BGR */90TU6_xxx(B8G8R8_UNORM, 8_8_8_UNORM, WXYZ), /* 30 */91TU6_xxx(B8G8R8_SNORM, 8_8_8_SNORM, WXYZ), /* 31 */92TU6_xxx(B8G8R8_USCALED, 8_8_8_UINT, WXYZ), /* 32 */93TU6_xxx(B8G8R8_SSCALED, 8_8_8_SINT, WXYZ), /* 33 */94TU6_xxx(B8G8R8_UINT, 8_8_8_UINT, WXYZ), /* 34 */95TU6_xxx(B8G8R8_SINT, 8_8_8_SINT, WXYZ), /* 35 */96TU6_xxx(B8G8R8_SRGB, 8_8_8_UNORM, WXYZ), /* 36 */9798/* 32-bit RGBA */99TU6_VTC(R8G8B8A8_UNORM, 
8_8_8_8_UNORM, WZYX), /* 37 */100TU6_VTC(R8G8B8A8_SNORM, 8_8_8_8_SNORM, WZYX), /* 38 */101TU6_Vxx(R8G8B8A8_USCALED, 8_8_8_8_UINT, WZYX), /* 39 */102TU6_Vxx(R8G8B8A8_SSCALED, 8_8_8_8_SINT, WZYX), /* 40 */103TU6_VTC(R8G8B8A8_UINT, 8_8_8_8_UINT, WZYX), /* 41 */104TU6_VTC(R8G8B8A8_SINT, 8_8_8_8_SINT, WZYX), /* 42 */105TU6_xTC(R8G8B8A8_SRGB, 8_8_8_8_UNORM, WZYX), /* 43 */106107/* 32-bit BGRA */108TU6_VTC(B8G8R8A8_UNORM, 8_8_8_8_UNORM, WXYZ), /* 44 */109TU6_VTC(B8G8R8A8_SNORM, 8_8_8_8_SNORM, WXYZ), /* 45 */110TU6_Vxx(B8G8R8A8_USCALED, 8_8_8_8_UINT, WXYZ), /* 46 */111TU6_Vxx(B8G8R8A8_SSCALED, 8_8_8_8_SINT, WXYZ), /* 47 */112TU6_VTC(B8G8R8A8_UINT, 8_8_8_8_UINT, WXYZ), /* 48 */113TU6_VTC(B8G8R8A8_SINT, 8_8_8_8_SINT, WXYZ), /* 49 */114TU6_xTC(B8G8R8A8_SRGB, 8_8_8_8_UNORM, WXYZ), /* 50 */115116/* 32-bit packed */117TU6_VTC(A8B8G8R8_UNORM_PACK32, 8_8_8_8_UNORM, WZYX), /* 51 */118TU6_VTC(A8B8G8R8_SNORM_PACK32, 8_8_8_8_SNORM, WZYX), /* 52 */119TU6_Vxx(A8B8G8R8_USCALED_PACK32, 8_8_8_8_UINT, WZYX), /* 53 */120TU6_Vxx(A8B8G8R8_SSCALED_PACK32, 8_8_8_8_SINT, WZYX), /* 54 */121TU6_VTC(A8B8G8R8_UINT_PACK32, 8_8_8_8_UINT, WZYX), /* 55 */122TU6_VTC(A8B8G8R8_SINT_PACK32, 8_8_8_8_SINT, WZYX), /* 56 */123TU6_xTC(A8B8G8R8_SRGB_PACK32, 8_8_8_8_UNORM, WZYX), /* 57 */124TU6_VTC(A2R10G10B10_UNORM_PACK32, 10_10_10_2_UNORM, WXYZ), /* 58 */125TU6_Vxx(A2R10G10B10_SNORM_PACK32, 10_10_10_2_SNORM, WXYZ), /* 59 */126TU6_Vxx(A2R10G10B10_USCALED_PACK32, 10_10_10_2_UINT, WXYZ), /* 60 */127TU6_Vxx(A2R10G10B10_SSCALED_PACK32, 10_10_10_2_SINT, WXYZ), /* 61 */128TU6_VTC(A2R10G10B10_UINT_PACK32, 10_10_10_2_UINT, WXYZ), /* 62 */129TU6_Vxx(A2R10G10B10_SINT_PACK32, 10_10_10_2_SINT, WXYZ), /* 63 */130TU6_VTC(A2B10G10R10_UNORM_PACK32, 10_10_10_2_UNORM, WZYX), /* 64 */131TU6_Vxx(A2B10G10R10_SNORM_PACK32, 10_10_10_2_SNORM, WZYX), /* 65 */132TU6_Vxx(A2B10G10R10_USCALED_PACK32, 10_10_10_2_UINT, WZYX), /* 66 */133TU6_Vxx(A2B10G10R10_SSCALED_PACK32, 10_10_10_2_SINT, WZYX), /* 67 */134TU6_VTC(A2B10G10R10_UINT_PACK32, 
10_10_10_2_UINT, WZYX), /* 68 */135TU6_Vxx(A2B10G10R10_SINT_PACK32, 10_10_10_2_SINT, WZYX), /* 69 */136137/* 16-bit R */138TU6_VTC(R16_UNORM, 16_UNORM, WZYX), /* 70 */139TU6_VTC(R16_SNORM, 16_SNORM, WZYX), /* 71 */140TU6_Vxx(R16_USCALED, 16_UINT, WZYX), /* 72 */141TU6_Vxx(R16_SSCALED, 16_SINT, WZYX), /* 73 */142TU6_VTC(R16_UINT, 16_UINT, WZYX), /* 74 */143TU6_VTC(R16_SINT, 16_SINT, WZYX), /* 75 */144TU6_VTC(R16_SFLOAT, 16_FLOAT, WZYX), /* 76 */145146/* 32-bit RG */147TU6_VTC(R16G16_UNORM, 16_16_UNORM, WZYX), /* 77 */148TU6_VTC(R16G16_SNORM, 16_16_SNORM, WZYX), /* 78 */149TU6_Vxx(R16G16_USCALED, 16_16_UINT, WZYX), /* 79 */150TU6_Vxx(R16G16_SSCALED, 16_16_SINT, WZYX), /* 80 */151TU6_VTC(R16G16_UINT, 16_16_UINT, WZYX), /* 81 */152TU6_VTC(R16G16_SINT, 16_16_SINT, WZYX), /* 82 */153TU6_VTC(R16G16_SFLOAT, 16_16_FLOAT, WZYX), /* 83 */154155/* 48-bit RGB */156TU6_Vxx(R16G16B16_UNORM, 16_16_16_UNORM, WZYX), /* 84 */157TU6_Vxx(R16G16B16_SNORM, 16_16_16_SNORM, WZYX), /* 85 */158TU6_Vxx(R16G16B16_USCALED, 16_16_16_UINT, WZYX), /* 86 */159TU6_Vxx(R16G16B16_SSCALED, 16_16_16_SINT, WZYX), /* 87 */160TU6_Vxx(R16G16B16_UINT, 16_16_16_UINT, WZYX), /* 88 */161TU6_Vxx(R16G16B16_SINT, 16_16_16_SINT, WZYX), /* 89 */162TU6_Vxx(R16G16B16_SFLOAT, 16_16_16_FLOAT, WZYX), /* 90 */163164/* 64-bit RGBA */165TU6_VTC(R16G16B16A16_UNORM, 16_16_16_16_UNORM, WZYX), /* 91 */166TU6_VTC(R16G16B16A16_SNORM, 16_16_16_16_SNORM, WZYX), /* 92 */167TU6_Vxx(R16G16B16A16_USCALED, 16_16_16_16_UINT, WZYX), /* 93 */168TU6_Vxx(R16G16B16A16_SSCALED, 16_16_16_16_SINT, WZYX), /* 94 */169TU6_VTC(R16G16B16A16_UINT, 16_16_16_16_UINT, WZYX), /* 95 */170TU6_VTC(R16G16B16A16_SINT, 16_16_16_16_SINT, WZYX), /* 96 */171TU6_VTC(R16G16B16A16_SFLOAT, 16_16_16_16_FLOAT, WZYX), /* 97 */172173/* 32-bit R */174TU6_VTC(R32_UINT, 32_UINT, WZYX), /* 98 */175TU6_VTC(R32_SINT, 32_SINT, WZYX), /* 99 */176TU6_VTC(R32_SFLOAT, 32_FLOAT, WZYX), /* 100 */177178/* 64-bit RG */179TU6_VTC(R32G32_UINT, 32_32_UINT, WZYX), /* 101 
*/180TU6_VTC(R32G32_SINT, 32_32_SINT, WZYX), /* 102 */181TU6_VTC(R32G32_SFLOAT, 32_32_FLOAT, WZYX), /* 103 */182183/* 96-bit RGB */184TU6_Vxx(R32G32B32_UINT, 32_32_32_UINT, WZYX), /* 104 */185TU6_Vxx(R32G32B32_SINT, 32_32_32_SINT, WZYX), /* 105 */186TU6_Vxx(R32G32B32_SFLOAT, 32_32_32_FLOAT, WZYX), /* 106 */187188/* 128-bit RGBA */189TU6_VTC(R32G32B32A32_UINT, 32_32_32_32_UINT, WZYX), /* 107 */190TU6_VTC(R32G32B32A32_SINT, 32_32_32_32_SINT, WZYX), /* 108 */191TU6_VTC(R32G32B32A32_SFLOAT, 32_32_32_32_FLOAT, WZYX), /* 109 */192193/* 64-bit R */194TU6_xxx(R64_UINT, 64_UINT, WZYX), /* 110 */195TU6_xxx(R64_SINT, 64_SINT, WZYX), /* 111 */196TU6_xxx(R64_SFLOAT, 64_FLOAT, WZYX), /* 112 */197198/* 128-bit RG */199TU6_xxx(R64G64_UINT, 64_64_UINT, WZYX), /* 113 */200TU6_xxx(R64G64_SINT, 64_64_SINT, WZYX), /* 114 */201TU6_xxx(R64G64_SFLOAT, 64_64_FLOAT, WZYX), /* 115 */202203/* 192-bit RGB */204TU6_xxx(R64G64B64_UINT, 64_64_64_UINT, WZYX), /* 116 */205TU6_xxx(R64G64B64_SINT, 64_64_64_SINT, WZYX), /* 117 */206TU6_xxx(R64G64B64_SFLOAT, 64_64_64_FLOAT, WZYX), /* 118 */207208/* 256-bit RGBA */209TU6_xxx(R64G64B64A64_UINT, 64_64_64_64_UINT, WZYX), /* 119 */210TU6_xxx(R64G64B64A64_SINT, 64_64_64_64_SINT, WZYX), /* 120 */211TU6_xxx(R64G64B64A64_SFLOAT, 64_64_64_64_FLOAT, WZYX), /* 121 */212213/* 32-bit packed float */214TU6_VTC(B10G11R11_UFLOAT_PACK32, 11_11_10_FLOAT, WZYX), /* 122 */215TU6_xTx(E5B9G9R9_UFLOAT_PACK32, 9_9_9_E5_FLOAT, WZYX), /* 123 */216217/* depth/stencil218* X8_D24_UNORM/D24_UNORM_S8_UINT should be Z24_UNORM_S8_UINT_AS_R8G8B8A8219* but the format doesn't work on A630 when UBWC is disabled, so use220* 8_8_8_8_UNORM as the default and override it when UBWC is enabled221*/222TU6_xTC(D16_UNORM, 16_UNORM, WZYX), /* 124 */223TU6_xTC(X8_D24_UNORM_PACK32, 8_8_8_8_UNORM, WZYX), /* 125 */224TU6_xTC(D32_SFLOAT, 32_FLOAT, WZYX), /* 126 */225TU6_xTC(S8_UINT, 8_UINT, WZYX), /* 127 */226TU6_xxx(D16_UNORM_S8_UINT, X8Z16_UNORM, WZYX), /* 128 */227TU6_xTC(D24_UNORM_S8_UINT, 
8_8_8_8_UNORM, WZYX), /* 129 */228TU6_xTC(D32_SFLOAT_S8_UINT, NONE, WZYX), /* 130 */229230/* compressed */231TU6_xTx(BC1_RGB_UNORM_BLOCK, DXT1, WZYX), /* 131 */232TU6_xTx(BC1_RGB_SRGB_BLOCK, DXT1, WZYX), /* 132 */233TU6_xTx(BC1_RGBA_UNORM_BLOCK, DXT1, WZYX), /* 133 */234TU6_xTx(BC1_RGBA_SRGB_BLOCK, DXT1, WZYX), /* 134 */235TU6_xTx(BC2_UNORM_BLOCK, DXT3, WZYX), /* 135 */236TU6_xTx(BC2_SRGB_BLOCK, DXT3, WZYX), /* 136 */237TU6_xTx(BC3_UNORM_BLOCK, DXT5, WZYX), /* 137 */238TU6_xTx(BC3_SRGB_BLOCK, DXT5, WZYX), /* 138 */239TU6_xTx(BC4_UNORM_BLOCK, RGTC1_UNORM, WZYX), /* 139 */240TU6_xTx(BC4_SNORM_BLOCK, RGTC1_SNORM, WZYX), /* 140 */241TU6_xTx(BC5_UNORM_BLOCK, RGTC2_UNORM, WZYX), /* 141 */242TU6_xTx(BC5_SNORM_BLOCK, RGTC2_SNORM, WZYX), /* 142 */243TU6_xTx(BC6H_UFLOAT_BLOCK, BPTC_UFLOAT, WZYX), /* 143 */244TU6_xTx(BC6H_SFLOAT_BLOCK, BPTC_FLOAT, WZYX), /* 144 */245TU6_xTx(BC7_UNORM_BLOCK, BPTC, WZYX), /* 145 */246TU6_xTx(BC7_SRGB_BLOCK, BPTC, WZYX), /* 146 */247TU6_xTx(ETC2_R8G8B8_UNORM_BLOCK, ETC2_RGB8, WZYX), /* 147 */248TU6_xTx(ETC2_R8G8B8_SRGB_BLOCK, ETC2_RGB8, WZYX), /* 148 */249TU6_xTx(ETC2_R8G8B8A1_UNORM_BLOCK, ETC2_RGB8A1, WZYX), /* 149 */250TU6_xTx(ETC2_R8G8B8A1_SRGB_BLOCK, ETC2_RGB8A1, WZYX), /* 150 */251TU6_xTx(ETC2_R8G8B8A8_UNORM_BLOCK, ETC2_RGBA8, WZYX), /* 151 */252TU6_xTx(ETC2_R8G8B8A8_SRGB_BLOCK, ETC2_RGBA8, WZYX), /* 152 */253TU6_xTx(EAC_R11_UNORM_BLOCK, ETC2_R11_UNORM, WZYX), /* 153 */254TU6_xTx(EAC_R11_SNORM_BLOCK, ETC2_R11_SNORM, WZYX), /* 154 */255TU6_xTx(EAC_R11G11_UNORM_BLOCK, ETC2_RG11_UNORM, WZYX), /* 155 */256TU6_xTx(EAC_R11G11_SNORM_BLOCK, ETC2_RG11_SNORM, WZYX), /* 156 */257TU6_xTx(ASTC_4x4_UNORM_BLOCK, ASTC_4x4, WZYX), /* 157 */258TU6_xTx(ASTC_4x4_SRGB_BLOCK, ASTC_4x4, WZYX), /* 158 */259TU6_xTx(ASTC_5x4_UNORM_BLOCK, ASTC_5x4, WZYX), /* 159 */260TU6_xTx(ASTC_5x4_SRGB_BLOCK, ASTC_5x4, WZYX), /* 160 */261TU6_xTx(ASTC_5x5_UNORM_BLOCK, ASTC_5x5, WZYX), /* 161 */262TU6_xTx(ASTC_5x5_SRGB_BLOCK, ASTC_5x5, WZYX), /* 162 
*/263TU6_xTx(ASTC_6x5_UNORM_BLOCK, ASTC_6x5, WZYX), /* 163 */264TU6_xTx(ASTC_6x5_SRGB_BLOCK, ASTC_6x5, WZYX), /* 164 */265TU6_xTx(ASTC_6x6_UNORM_BLOCK, ASTC_6x6, WZYX), /* 165 */266TU6_xTx(ASTC_6x6_SRGB_BLOCK, ASTC_6x6, WZYX), /* 166 */267TU6_xTx(ASTC_8x5_UNORM_BLOCK, ASTC_8x5, WZYX), /* 167 */268TU6_xTx(ASTC_8x5_SRGB_BLOCK, ASTC_8x5, WZYX), /* 168 */269TU6_xTx(ASTC_8x6_UNORM_BLOCK, ASTC_8x6, WZYX), /* 169 */270TU6_xTx(ASTC_8x6_SRGB_BLOCK, ASTC_8x6, WZYX), /* 170 */271TU6_xTx(ASTC_8x8_UNORM_BLOCK, ASTC_8x8, WZYX), /* 171 */272TU6_xTx(ASTC_8x8_SRGB_BLOCK, ASTC_8x8, WZYX), /* 172 */273TU6_xTx(ASTC_10x5_UNORM_BLOCK, ASTC_10x5, WZYX), /* 173 */274TU6_xTx(ASTC_10x5_SRGB_BLOCK, ASTC_10x5, WZYX), /* 174 */275TU6_xTx(ASTC_10x6_UNORM_BLOCK, ASTC_10x6, WZYX), /* 175 */276TU6_xTx(ASTC_10x6_SRGB_BLOCK, ASTC_10x6, WZYX), /* 176 */277TU6_xTx(ASTC_10x8_UNORM_BLOCK, ASTC_10x8, WZYX), /* 177 */278TU6_xTx(ASTC_10x8_SRGB_BLOCK, ASTC_10x8, WZYX), /* 178 */279TU6_xTx(ASTC_10x10_UNORM_BLOCK, ASTC_10x10, WZYX), /* 179 */280TU6_xTx(ASTC_10x10_SRGB_BLOCK, ASTC_10x10, WZYX), /* 180 */281TU6_xTx(ASTC_12x10_UNORM_BLOCK, ASTC_12x10, WZYX), /* 181 */282TU6_xTx(ASTC_12x10_SRGB_BLOCK, ASTC_12x10, WZYX), /* 182 */283TU6_xTx(ASTC_12x12_UNORM_BLOCK, ASTC_12x12, WZYX), /* 183 */284TU6_xTx(ASTC_12x12_SRGB_BLOCK, ASTC_12x12, WZYX), /* 184 */285};286287#undef TU6_FMT288#define TU6_FMT(vkfmt, hwfmt, swapfmt, valid) \289case VK_FORMAT_##vkfmt: \290fmt = (struct tu_native_format) { \291.fmt = FMT6_##hwfmt, \292.swap = swapfmt, \293.supported = valid, \294}; break;295296static struct tu_native_format297tu6_get_native_format(VkFormat format)298{299struct tu_native_format fmt = {};300301if (format < ARRAY_SIZE(tu6_format_table)) {302fmt = tu6_format_table[format];303} else {304switch (format) {305TU6_xTx(G8B8G8R8_422_UNORM, R8G8R8B8_422_UNORM, WZYX)306TU6_xTx(B8G8R8G8_422_UNORM, G8R8B8R8_422_UNORM, WZYX)307TU6_xTx(G8_B8_R8_3PLANE_420_UNORM, R8_G8_B8_3PLANE_420_UNORM, WZYX)308TU6_xTx(G8_B8R8_2PLANE_420_UNORM, 
R8_G8B8_2PLANE_420_UNORM, WZYX)309TU6_xTC(A4R4G4B4_UNORM_PACK16_EXT, 4_4_4_4_UNORM, WXYZ)310TU6_xTC(A4B4G4R4_UNORM_PACK16_EXT, 4_4_4_4_UNORM, WZYX)311default:312break;313}314}315316if (fmt.supported && vk_format_to_pipe_format(format) == PIPE_FORMAT_NONE) {317tu_finishme("vk_format %d missing matching pipe format.\n", format);318fmt.supported = false;319}320321return fmt;322}323324struct tu_native_format325tu6_format_vtx(VkFormat format)326{327struct tu_native_format fmt = tu6_get_native_format(format);328assert(fmt.supported & FMT_VERTEX);329return fmt;330}331332struct tu_native_format333tu6_format_color(VkFormat format, enum a6xx_tile_mode tile_mode)334{335struct tu_native_format fmt = tu6_get_native_format(format);336assert(fmt.supported & FMT_COLOR);337338if (fmt.fmt == FMT6_10_10_10_2_UNORM)339fmt.fmt = FMT6_10_10_10_2_UNORM_DEST;340341if (tile_mode)342fmt.swap = WZYX;343344return fmt;345}346347struct tu_native_format348tu6_format_texture(VkFormat format, enum a6xx_tile_mode tile_mode)349{350struct tu_native_format fmt = tu6_get_native_format(format);351assert(fmt.supported & FMT_TEXTURE);352353if (!tile_mode) {354/* different from format table when used as linear src */355if (format == VK_FORMAT_R5G5B5A1_UNORM_PACK16)356fmt.fmt = FMT6_1_5_5_5_UNORM, fmt.swap = WXYZ;357if (format == VK_FORMAT_B5G5R5A1_UNORM_PACK16)358fmt.fmt = FMT6_1_5_5_5_UNORM, fmt.swap = WZYX;359} else {360fmt.swap = WZYX;361}362363return fmt;364}365366static void367tu_physical_device_get_format_properties(368struct tu_physical_device *physical_device,369VkFormat format,370VkFormatProperties *out_properties)371{372VkFormatFeatureFlags linear = 0, optimal = 0, buffer = 0;373const struct util_format_description *desc = vk_format_description(format);374const struct tu_native_format native_fmt = tu6_get_native_format(format);375if (!desc || !native_fmt.supported) {376goto end;377}378379buffer |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT | VK_FORMAT_FEATURE_TRANSFER_DST_BIT;380if (native_fmt.supported 
& FMT_VERTEX)381buffer |= VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT;382383if (native_fmt.supported & FMT_TEXTURE) {384optimal |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT |385VK_FORMAT_FEATURE_TRANSFER_DST_BIT |386VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT |387VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_MINMAX_BIT |388VK_FORMAT_FEATURE_COSITED_CHROMA_SAMPLES_BIT |389VK_FORMAT_FEATURE_MIDPOINT_CHROMA_SAMPLES_BIT;390391buffer |= VK_FORMAT_FEATURE_UNIFORM_TEXEL_BUFFER_BIT;392393/* no blit src bit for YUYV/NV12/I420 formats */394if (desc->layout != UTIL_FORMAT_LAYOUT_SUBSAMPLED &&395desc->layout != UTIL_FORMAT_LAYOUT_PLANAR2 &&396desc->layout != UTIL_FORMAT_LAYOUT_PLANAR3)397optimal |= VK_FORMAT_FEATURE_BLIT_SRC_BIT;398399if (desc->layout != UTIL_FORMAT_LAYOUT_SUBSAMPLED)400optimal |= VK_FORMAT_FEATURE_SAMPLED_IMAGE_YCBCR_CONVERSION_LINEAR_FILTER_BIT;401402if (!vk_format_is_int(format)) {403optimal |= VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_LINEAR_BIT;404405if (physical_device->vk.supported_extensions.EXT_filter_cubic)406optimal |= VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_CUBIC_BIT_EXT;407}408}409410if (native_fmt.supported & FMT_COLOR) {411assert(native_fmt.supported & FMT_TEXTURE);412optimal |= VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT |413VK_FORMAT_FEATURE_BLIT_DST_BIT;414415/* IBO's don't have a swap field at all, so swapped formats can't be416* supported, even with linear images.417*418* TODO: See if setting the swap field from the tex descriptor works,419* after we enable shaderStorageImageReadWithoutFormat and there are420* tests for these formats.421*/422if (native_fmt.swap == WZYX) {423optimal |= VK_FORMAT_FEATURE_STORAGE_IMAGE_BIT;424buffer |= VK_FORMAT_FEATURE_STORAGE_TEXEL_BUFFER_BIT;425}426427/* TODO: The blob also exposes these for R16G16_UINT/R16G16_SINT, but we428* don't have any tests for those.429*/430if (format == VK_FORMAT_R32_UINT || format == VK_FORMAT_R32_SINT) {431optimal |= VK_FORMAT_FEATURE_STORAGE_IMAGE_ATOMIC_BIT;432buffer |= 
VK_FORMAT_FEATURE_STORAGE_TEXEL_BUFFER_ATOMIC_BIT;433}434435if (!vk_format_is_int(format))436optimal |= VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT;437}438439/* For the most part, we can do anything with a linear image that we could440* do with a tiled image. However, we can't support sysmem rendering with a441* linear depth texture, because we don't know if there's a bit to control442* the tiling of the depth buffer in BYPASS mode, and the blob also443* disables linear depth rendering, so there's no way to discover it. We444* also can't force GMEM mode, because there are other situations where we445* have to use sysmem rendering. So follow the blob here, and only enable446* DEPTH_STENCIL_ATTACHMENT_BIT for the optimal features.447*/448linear = optimal;449if (tu6_pipe2depth(format) != (enum a6xx_depth_format)~0)450optimal |= VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT;451452if (format == VK_FORMAT_G8B8G8R8_422_UNORM ||453format == VK_FORMAT_B8G8R8G8_422_UNORM ||454format == VK_FORMAT_G8_B8R8_2PLANE_420_UNORM ||455format == VK_FORMAT_G8_B8_R8_3PLANE_420_UNORM) {456/* no tiling for special UBWC formats457* TODO: NV12 can be UBWC but has a special UBWC format for accessing the Y plane aspect458* for 3plane, tiling/UBWC might be supported, but the blob doesn't use tiling459*/460optimal = 0;461462/* Disable buffer texturing of subsampled (422) and planar YUV textures.463* The subsampling requirement comes from "If format is a block-compressed464* format, then bufferFeatures must not support any features for the465* format" plus the specification of subsampled as 2x1 compressed block466* format. 
I couldn't find the citation for planar, but 1D access of467* planar YUV would be really silly.468*/469buffer = 0;470}471472/* D32_SFLOAT_S8_UINT is tiled as two images, so no linear format473* blob enables some linear features, but its not useful, so don't bother.474*/475if (format == VK_FORMAT_D32_SFLOAT_S8_UINT)476linear = 0;477478end:479out_properties->linearTilingFeatures = linear;480out_properties->optimalTilingFeatures = optimal;481out_properties->bufferFeatures = buffer;482}483484VKAPI_ATTR void VKAPI_CALL485tu_GetPhysicalDeviceFormatProperties2(486VkPhysicalDevice physicalDevice,487VkFormat format,488VkFormatProperties2 *pFormatProperties)489{490TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);491492tu_physical_device_get_format_properties(493physical_device, format, &pFormatProperties->formatProperties);494495VkDrmFormatModifierPropertiesListEXT *list =496vk_find_struct(pFormatProperties->pNext, DRM_FORMAT_MODIFIER_PROPERTIES_LIST_EXT);497if (list) {498VK_OUTARRAY_MAKE(out, list->pDrmFormatModifierProperties,499&list->drmFormatModifierCount);500501if (pFormatProperties->formatProperties.linearTilingFeatures) {502vk_outarray_append(&out, mod_props) {503mod_props->drmFormatModifier = DRM_FORMAT_MOD_LINEAR;504mod_props->drmFormatModifierPlaneCount = 1;505}506}507508/* note: ubwc_possible() argument values to be ignored except for format */509if (pFormatProperties->formatProperties.optimalTilingFeatures &&510ubwc_possible(format, VK_IMAGE_TYPE_2D, 0, 0, physical_device->info, VK_SAMPLE_COUNT_1_BIT)) {511vk_outarray_append(&out, mod_props) {512mod_props->drmFormatModifier = DRM_FORMAT_MOD_QCOM_COMPRESSED;513mod_props->drmFormatModifierPlaneCount = 1;514}515}516}517}518519static VkResult520tu_get_image_format_properties(521struct tu_physical_device *physical_device,522const VkPhysicalDeviceImageFormatInfo2 *info,523VkImageFormatProperties *pImageFormatProperties,524VkFormatFeatureFlags *p_feature_flags)525{526VkFormatProperties 
format_props;527VkFormatFeatureFlags format_feature_flags;528VkExtent3D maxExtent;529uint32_t maxMipLevels;530uint32_t maxArraySize;531VkSampleCountFlags sampleCounts = VK_SAMPLE_COUNT_1_BIT;532533tu_physical_device_get_format_properties(physical_device, info->format,534&format_props);535536switch (info->tiling) {537case VK_IMAGE_TILING_LINEAR:538format_feature_flags = format_props.linearTilingFeatures;539break;540541case VK_IMAGE_TILING_DRM_FORMAT_MODIFIER_EXT: {542const VkPhysicalDeviceImageDrmFormatModifierInfoEXT *drm_info =543vk_find_struct_const(info->pNext, PHYSICAL_DEVICE_IMAGE_DRM_FORMAT_MODIFIER_INFO_EXT);544545switch (drm_info->drmFormatModifier) {546case DRM_FORMAT_MOD_QCOM_COMPRESSED:547/* falling back to linear/non-UBWC isn't possible with explicit modifier */548549/* formats which don't support tiling */550if (!format_props.optimalTilingFeatures)551return VK_ERROR_FORMAT_NOT_SUPPORTED;552553/* for mutable formats, its very unlikely to be possible to use UBWC */554if (info->flags & VK_IMAGE_CREATE_MUTABLE_FORMAT_BIT)555return VK_ERROR_FORMAT_NOT_SUPPORTED;556557558if (!ubwc_possible(info->format, info->type, info->usage, info->usage, physical_device->info, sampleCounts))559return VK_ERROR_FORMAT_NOT_SUPPORTED;560561format_feature_flags = format_props.optimalTilingFeatures;562break;563case DRM_FORMAT_MOD_LINEAR:564format_feature_flags = format_props.linearTilingFeatures;565break;566default:567return VK_ERROR_FORMAT_NOT_SUPPORTED;568}569} break;570case VK_IMAGE_TILING_OPTIMAL:571format_feature_flags = format_props.optimalTilingFeatures;572break;573default:574unreachable("bad VkPhysicalDeviceImageFormatInfo2");575}576577if (format_feature_flags == 0)578goto unsupported;579580if (info->type != VK_IMAGE_TYPE_2D &&581vk_format_is_depth_or_stencil(info->format))582goto unsupported;583584switch (info->type) {585default:586unreachable("bad vkimage type\n");587case VK_IMAGE_TYPE_1D:588maxExtent.width = 16384;589maxExtent.height = 1;590maxExtent.depth = 
1;591maxMipLevels = 15; /* log2(maxWidth) + 1 */592maxArraySize = 2048;593break;594case VK_IMAGE_TYPE_2D:595maxExtent.width = 16384;596maxExtent.height = 16384;597maxExtent.depth = 1;598maxMipLevels = 15; /* log2(maxWidth) + 1 */599maxArraySize = 2048;600break;601case VK_IMAGE_TYPE_3D:602maxExtent.width = 2048;603maxExtent.height = 2048;604maxExtent.depth = 2048;605maxMipLevels = 12; /* log2(maxWidth) + 1 */606maxArraySize = 1;607break;608}609610if (info->tiling == VK_IMAGE_TILING_OPTIMAL &&611info->type == VK_IMAGE_TYPE_2D &&612(format_feature_flags &613(VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT |614VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)) &&615!(info->flags & VK_IMAGE_CREATE_CUBE_COMPATIBLE_BIT) &&616!(info->usage & VK_IMAGE_USAGE_STORAGE_BIT)) {617sampleCounts |= VK_SAMPLE_COUNT_2_BIT | VK_SAMPLE_COUNT_4_BIT;618/* note: most operations support 8 samples (GMEM render/resolve do at least)619* but some do not (which ones?), just disable 8 samples completely,620* (no 8x msaa matches the blob driver behavior)621*/622}623624if (info->usage & VK_IMAGE_USAGE_SAMPLED_BIT) {625if (!(format_feature_flags & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT)) {626goto unsupported;627}628}629630if (info->usage & VK_IMAGE_USAGE_STORAGE_BIT) {631if (!(format_feature_flags & VK_FORMAT_FEATURE_STORAGE_IMAGE_BIT)) {632goto unsupported;633}634}635636if (info->usage & VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT) {637if (!(format_feature_flags & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT)) {638goto unsupported;639}640}641642if (info->usage & VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT) {643if (!(format_feature_flags &644VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)) {645goto unsupported;646}647}648649*pImageFormatProperties = (VkImageFormatProperties) {650.maxExtent = maxExtent,651.maxMipLevels = maxMipLevels,652.maxArrayLayers = maxArraySize,653.sampleCounts = sampleCounts,654655/* FINISHME: Accurately calculate656* VkImageFormatProperties::maxResourceSize.657*/658.maxResourceSize = 
UINT32_MAX,659};660661if (p_feature_flags)662*p_feature_flags = format_feature_flags;663664return VK_SUCCESS;665unsupported:666*pImageFormatProperties = (VkImageFormatProperties) {667.maxExtent = { 0, 0, 0 },668.maxMipLevels = 0,669.maxArrayLayers = 0,670.sampleCounts = 0,671.maxResourceSize = 0,672};673674return VK_ERROR_FORMAT_NOT_SUPPORTED;675}676677static VkResult678tu_get_external_image_format_properties(679const struct tu_physical_device *physical_device,680const VkPhysicalDeviceImageFormatInfo2 *pImageFormatInfo,681VkExternalMemoryHandleTypeFlagBits handleType,682VkExternalMemoryProperties *external_properties)683{684VkExternalMemoryFeatureFlagBits flags = 0;685VkExternalMemoryHandleTypeFlags export_flags = 0;686VkExternalMemoryHandleTypeFlags compat_flags = 0;687688/* From the Vulkan 1.1.98 spec:689*690* If handleType is not compatible with the format, type, tiling,691* usage, and flags specified in VkPhysicalDeviceImageFormatInfo2,692* then vkGetPhysicalDeviceImageFormatProperties2 returns693* VK_ERROR_FORMAT_NOT_SUPPORTED.694*/695696switch (handleType) {697case VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT:698case VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT:699switch (pImageFormatInfo->type) {700case VK_IMAGE_TYPE_2D:701flags = VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT |702VK_EXTERNAL_MEMORY_FEATURE_EXPORTABLE_BIT |703VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;704compat_flags = export_flags =705VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT |706VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT;707break;708default:709return vk_errorf(physical_device->instance, VK_ERROR_FORMAT_NOT_SUPPORTED,710"VkExternalMemoryTypeFlagBits(0x%x) unsupported for VkImageType(%d)",711handleType, pImageFormatInfo->type);712}713break;714case VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT:715flags = VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;716compat_flags = VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT;717break;718default:719return 
vk_errorf(physical_device->instance, VK_ERROR_FORMAT_NOT_SUPPORTED,720"VkExternalMemoryTypeFlagBits(0x%x) unsupported",721handleType);722}723724*external_properties = (VkExternalMemoryProperties) {725.externalMemoryFeatures = flags,726.exportFromImportedHandleTypes = export_flags,727.compatibleHandleTypes = compat_flags,728};729730return VK_SUCCESS;731}732733VKAPI_ATTR VkResult VKAPI_CALL734tu_GetPhysicalDeviceImageFormatProperties2(735VkPhysicalDevice physicalDevice,736const VkPhysicalDeviceImageFormatInfo2 *base_info,737VkImageFormatProperties2 *base_props)738{739TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);740const VkPhysicalDeviceExternalImageFormatInfo *external_info = NULL;741const VkPhysicalDeviceImageViewImageFormatInfoEXT *image_view_info = NULL;742VkExternalImageFormatProperties *external_props = NULL;743VkFilterCubicImageViewImageFormatPropertiesEXT *cubic_props = NULL;744VkFormatFeatureFlags format_feature_flags;745VkSamplerYcbcrConversionImageFormatProperties *ycbcr_props = NULL;746VkResult result;747748result = tu_get_image_format_properties(physical_device,749base_info, &base_props->imageFormatProperties, &format_feature_flags);750if (result != VK_SUCCESS)751return result;752753/* Extract input structs */754vk_foreach_struct_const(s, base_info->pNext)755{756switch (s->sType) {757case VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_EXTERNAL_IMAGE_FORMAT_INFO:758external_info = (const void *) s;759break;760case VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_IMAGE_VIEW_IMAGE_FORMAT_INFO_EXT:761image_view_info = (const void *) s;762break;763default:764break;765}766}767768/* Extract output structs */769vk_foreach_struct(s, base_props->pNext)770{771switch (s->sType) {772case VK_STRUCTURE_TYPE_EXTERNAL_IMAGE_FORMAT_PROPERTIES:773external_props = (void *) s;774break;775case VK_STRUCTURE_TYPE_FILTER_CUBIC_IMAGE_VIEW_IMAGE_FORMAT_PROPERTIES_EXT:776cubic_props = (void *) s;777break;778case 
VK_STRUCTURE_TYPE_SAMPLER_YCBCR_CONVERSION_IMAGE_FORMAT_PROPERTIES:779ycbcr_props = (void *) s;780break;781default:782break;783}784}785786/* From the Vulkan 1.0.42 spec:787*788* If handleType is 0, vkGetPhysicalDeviceImageFormatProperties2 will789* behave as if VkPhysicalDeviceExternalImageFormatInfo was not790* present and VkExternalImageFormatProperties will be ignored.791*/792if (external_info && external_info->handleType != 0) {793result = tu_get_external_image_format_properties(794physical_device, base_info, external_info->handleType,795&external_props->externalMemoryProperties);796if (result != VK_SUCCESS)797goto fail;798}799800if (cubic_props) {801/* note: blob only allows cubic filtering for 2D and 2D array views802* its likely we can enable it for 1D and CUBE, needs testing however803*/804if ((image_view_info->imageViewType == VK_IMAGE_VIEW_TYPE_2D ||805image_view_info->imageViewType == VK_IMAGE_VIEW_TYPE_2D_ARRAY) &&806(format_feature_flags & VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_CUBIC_BIT_EXT)) {807cubic_props->filterCubic = true;808cubic_props->filterCubicMinmax = true;809} else {810cubic_props->filterCubic = false;811cubic_props->filterCubicMinmax = false;812}813}814815if (ycbcr_props)816ycbcr_props->combinedImageSamplerDescriptorCount = 1;817818return VK_SUCCESS;819820fail:821if (result == VK_ERROR_FORMAT_NOT_SUPPORTED) {822/* From the Vulkan 1.0.42 spec:823*824* If the combination of parameters to825* vkGetPhysicalDeviceImageFormatProperties2 is not supported by826* the implementation for use in vkCreateImage, then all members of827* imageFormatProperties will be filled with zero.828*/829base_props->imageFormatProperties = (VkImageFormatProperties) {};830}831832return result;833}834835VKAPI_ATTR void VKAPI_CALL836tu_GetPhysicalDeviceSparseImageFormatProperties2(837VkPhysicalDevice physicalDevice,838const VkPhysicalDeviceSparseImageFormatInfo2 *pFormatInfo,839uint32_t *pPropertyCount,840VkSparseImageFormatProperties2 *pProperties)841{842/* Sparse 
images are not yet supported. */843*pPropertyCount = 0;844}845846VKAPI_ATTR void VKAPI_CALL847tu_GetPhysicalDeviceExternalBufferProperties(848VkPhysicalDevice physicalDevice,849const VkPhysicalDeviceExternalBufferInfo *pExternalBufferInfo,850VkExternalBufferProperties *pExternalBufferProperties)851{852VkExternalMemoryFeatureFlagBits flags = 0;853VkExternalMemoryHandleTypeFlags export_flags = 0;854VkExternalMemoryHandleTypeFlags compat_flags = 0;855switch (pExternalBufferInfo->handleType) {856case VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT:857case VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT:858flags = VK_EXTERNAL_MEMORY_FEATURE_EXPORTABLE_BIT |859VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;860compat_flags = export_flags =861VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT |862VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT;863break;864case VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT:865flags = VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;866compat_flags = VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT;867break;868default:869break;870}871pExternalBufferProperties->externalMemoryProperties =872(VkExternalMemoryProperties) {873.externalMemoryFeatures = flags,874.exportFromImportedHandleTypes = export_flags,875.compatibleHandleTypes = compat_flags,876};877}878879880