Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
PojavLauncherTeam
GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/amd/vulkan/radv_meta_dcc_retile.c
7326 views
1
/*
2
* Copyright © 2021 Google
3
*
4
* Permission is hereby granted, free of charge, to any person obtaining a
5
* copy of this software and associated documentation files (the "Software"),
6
* to deal in the Software without restriction, including without limitation
7
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
8
* and/or sell copies of the Software, and to permit persons to whom the
9
* Software is furnished to do so, subject to the following conditions:
10
*
11
* The above copyright notice and this permission notice (including the next
12
* paragraph) shall be included in all copies or substantial portions of the
13
* Software.
14
*
15
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21
* IN THE SOFTWARE.
22
*/
23
24
#define AC_SURFACE_INCLUDE_NIR
25
#include "ac_surface.h"
26
27
#include "radv_meta.h"
28
#include "radv_private.h"
29
30
static nir_ssa_def *
31
get_global_ids(nir_builder *b, unsigned num_components)
32
{
33
unsigned mask = BITFIELD_MASK(num_components);
34
35
nir_ssa_def *local_ids = nir_channels(b, nir_load_local_invocation_id(b), mask);
36
nir_ssa_def *block_ids = nir_channels(b, nir_load_workgroup_id(b, 32), mask);
37
nir_ssa_def *block_size = nir_channels(
38
b,
39
nir_imm_ivec4(b, b->shader->info.workgroup_size[0], b->shader->info.workgroup_size[1],
40
b->shader->info.workgroup_size[2], 0),
41
mask);
42
43
return nir_iadd(b, nir_imul(b, block_ids, block_size), local_ids);
44
}
45
46
static nir_shader *
47
build_dcc_retile_compute_shader(struct radv_device *dev, struct radeon_surf *surf)
48
{
49
const struct glsl_type *buf_type = glsl_image_type(GLSL_SAMPLER_DIM_BUF, false, GLSL_TYPE_UINT);
50
nir_builder b = nir_builder_init_simple_shader(MESA_SHADER_COMPUTE, NULL, "dcc_retile_compute");
51
52
b.shader->info.workgroup_size[0] = 8;
53
b.shader->info.workgroup_size[1] = 8;
54
b.shader->info.workgroup_size[2] = 1;
55
56
nir_ssa_def *src_dcc_size = nir_load_push_constant(&b, 2, 32, nir_imm_int(&b, 0), .range = 8);
57
nir_ssa_def *src_dcc_pitch = nir_channels(&b, src_dcc_size, 1);
58
nir_ssa_def *src_dcc_height = nir_channels(&b, src_dcc_size, 2);
59
60
nir_ssa_def *dst_dcc_size = nir_load_push_constant(&b, 2, 32, nir_imm_int(&b, 8), .range = 8);
61
nir_ssa_def *dst_dcc_pitch = nir_channels(&b, dst_dcc_size, 1);
62
nir_ssa_def *dst_dcc_height = nir_channels(&b, dst_dcc_size, 2);
63
nir_variable *input_dcc = nir_variable_create(b.shader, nir_var_uniform, buf_type, "dcc_in");
64
input_dcc->data.descriptor_set = 0;
65
input_dcc->data.binding = 0;
66
nir_variable *output_dcc = nir_variable_create(b.shader, nir_var_uniform, buf_type, "dcc_out");
67
output_dcc->data.descriptor_set = 0;
68
output_dcc->data.binding = 1;
69
70
nir_ssa_def *input_dcc_ref = &nir_build_deref_var(&b, input_dcc)->dest.ssa;
71
nir_ssa_def *output_dcc_ref = &nir_build_deref_var(&b, output_dcc)->dest.ssa;
72
73
nir_ssa_def *coord = get_global_ids(&b, 2);
74
nir_ssa_def *zero = nir_imm_int(&b, 0);
75
coord = nir_imul(
76
&b, coord,
77
nir_imm_ivec2(&b, surf->u.gfx9.color.dcc_block_width, surf->u.gfx9.color.dcc_block_height));
78
79
nir_ssa_def *src = ac_nir_dcc_addr_from_coord(&b, &dev->physical_device->rad_info, surf->bpe,
80
&surf->u.gfx9.color.dcc_equation, src_dcc_pitch,
81
src_dcc_height, zero, nir_channel(&b, coord, 0),
82
nir_channel(&b, coord, 1), zero, zero, zero);
83
nir_ssa_def *dst = ac_nir_dcc_addr_from_coord(
84
&b, &dev->physical_device->rad_info, surf->bpe, &surf->u.gfx9.color.display_dcc_equation,
85
dst_dcc_pitch, dst_dcc_height, zero, nir_channel(&b, coord, 0), nir_channel(&b, coord, 1),
86
zero, zero, zero);
87
88
nir_intrinsic_instr *dcc_val =
89
nir_intrinsic_instr_create(b.shader, nir_intrinsic_image_deref_load);
90
dcc_val->num_components = 1;
91
dcc_val->src[0] = nir_src_for_ssa(input_dcc_ref);
92
dcc_val->src[1] = nir_src_for_ssa(nir_vec4(&b, src, src, src, src));
93
dcc_val->src[2] = nir_src_for_ssa(nir_ssa_undef(&b, 1, 32));
94
dcc_val->src[3] = nir_src_for_ssa(nir_imm_int(&b, 0));
95
nir_ssa_dest_init(&dcc_val->instr, &dcc_val->dest, 1, 32, "dcc_val");
96
nir_builder_instr_insert(&b, &dcc_val->instr);
97
98
nir_intrinsic_instr *store =
99
nir_intrinsic_instr_create(b.shader, nir_intrinsic_image_deref_store);
100
store->num_components = 1;
101
store->src[0] = nir_src_for_ssa(output_dcc_ref);
102
store->src[1] = nir_src_for_ssa(nir_vec4(&b, dst, dst, dst, dst));
103
store->src[2] = nir_src_for_ssa(nir_ssa_undef(&b, 1, 32));
104
store->src[3] = nir_src_for_ssa(&dcc_val->dest.ssa);
105
store->src[4] = nir_src_for_ssa(nir_imm_int(&b, 0));
106
107
nir_builder_instr_insert(&b, &store->instr);
108
return b.shader;
109
}
110
111
void
112
radv_device_finish_meta_dcc_retile_state(struct radv_device *device)
113
{
114
struct radv_meta_state *state = &device->meta_state;
115
116
radv_DestroyPipeline(radv_device_to_handle(device), state->dcc_retile.pipeline, &state->alloc);
117
radv_DestroyPipelineLayout(radv_device_to_handle(device), state->dcc_retile.p_layout,
118
&state->alloc);
119
radv_DestroyDescriptorSetLayout(radv_device_to_handle(device), state->dcc_retile.ds_layout,
120
&state->alloc);
121
122
/* Reset for next finish. */
123
memset(&state->dcc_retile, 0, sizeof(state->dcc_retile));
124
}
125
126
/*
127
* This take a surface, but the only things used are:
128
* - BPE
129
* - DCC equations
130
* - DCC block size
131
*
132
* BPE is always 4 at the moment and the rest is derived from the tilemode,
133
* and ac_surface limits displayable DCC to at most 1 tiling mode. So in effect
134
* this shader is indepedent of the surface.
135
*/
136
static VkResult
137
radv_device_init_meta_dcc_retile_state(struct radv_device *device, struct radeon_surf *surf)
138
{
139
VkResult result = VK_SUCCESS;
140
nir_shader *cs = build_dcc_retile_compute_shader(device, surf);
141
142
VkDescriptorSetLayoutCreateInfo ds_create_info = {
143
.sType = VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO,
144
.flags = VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR,
145
.bindingCount = 2,
146
.pBindings = (VkDescriptorSetLayoutBinding[]){
147
{.binding = 0,
148
.descriptorType = VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER,
149
.descriptorCount = 1,
150
.stageFlags = VK_SHADER_STAGE_COMPUTE_BIT,
151
.pImmutableSamplers = NULL},
152
{.binding = 1,
153
.descriptorType = VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER,
154
.descriptorCount = 1,
155
.stageFlags = VK_SHADER_STAGE_COMPUTE_BIT,
156
.pImmutableSamplers = NULL},
157
}};
158
159
result = radv_CreateDescriptorSetLayout(radv_device_to_handle(device), &ds_create_info,
160
&device->meta_state.alloc,
161
&device->meta_state.dcc_retile.ds_layout);
162
if (result != VK_SUCCESS)
163
goto cleanup;
164
165
VkPipelineLayoutCreateInfo pl_create_info = {
166
.sType = VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO,
167
.setLayoutCount = 1,
168
.pSetLayouts = &device->meta_state.dcc_retile.ds_layout,
169
.pushConstantRangeCount = 1,
170
.pPushConstantRanges = &(VkPushConstantRange){VK_SHADER_STAGE_COMPUTE_BIT, 0, 16},
171
};
172
173
result =
174
radv_CreatePipelineLayout(radv_device_to_handle(device), &pl_create_info,
175
&device->meta_state.alloc, &device->meta_state.dcc_retile.p_layout);
176
if (result != VK_SUCCESS)
177
goto cleanup;
178
179
/* compute shader */
180
181
VkPipelineShaderStageCreateInfo pipeline_shader_stage = {
182
.sType = VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO,
183
.stage = VK_SHADER_STAGE_COMPUTE_BIT,
184
.module = vk_shader_module_handle_from_nir(cs),
185
.pName = "main",
186
.pSpecializationInfo = NULL,
187
};
188
189
VkComputePipelineCreateInfo vk_pipeline_info = {
190
.sType = VK_STRUCTURE_TYPE_COMPUTE_PIPELINE_CREATE_INFO,
191
.stage = pipeline_shader_stage,
192
.flags = 0,
193
.layout = device->meta_state.dcc_retile.p_layout,
194
};
195
196
result = radv_CreateComputePipelines(
197
radv_device_to_handle(device), radv_pipeline_cache_to_handle(&device->meta_state.cache), 1,
198
&vk_pipeline_info, NULL, &device->meta_state.dcc_retile.pipeline);
199
if (result != VK_SUCCESS)
200
goto cleanup;
201
202
cleanup:
203
if (result != VK_SUCCESS)
204
radv_device_finish_meta_dcc_retile_state(device);
205
ralloc_free(cs);
206
return result;
207
}
208
209
void
210
radv_retile_dcc(struct radv_cmd_buffer *cmd_buffer, struct radv_image *image)
211
{
212
struct radv_meta_saved_state saved_state;
213
struct radv_device *device = cmd_buffer->device;
214
215
assert(image->type == VK_IMAGE_TYPE_2D);
216
assert(image->info.array_size == 1 && image->info.levels == 1);
217
218
struct radv_cmd_state *state = &cmd_buffer->state;
219
220
state->flush_bits |= radv_dst_access_flush(cmd_buffer, VK_ACCESS_SHADER_READ_BIT, image) |
221
radv_dst_access_flush(cmd_buffer, VK_ACCESS_SHADER_WRITE_BIT, image);
222
223
/* Compile pipelines if not already done so. */
224
if (!cmd_buffer->device->meta_state.dcc_retile.pipeline) {
225
VkResult ret =
226
radv_device_init_meta_dcc_retile_state(cmd_buffer->device, &image->planes[0].surface);
227
if (ret != VK_SUCCESS) {
228
cmd_buffer->record_result = ret;
229
return;
230
}
231
}
232
233
radv_meta_save(
234
&saved_state, cmd_buffer,
235
RADV_META_SAVE_DESCRIPTORS | RADV_META_SAVE_COMPUTE_PIPELINE | RADV_META_SAVE_CONSTANTS);
236
237
radv_CmdBindPipeline(radv_cmd_buffer_to_handle(cmd_buffer), VK_PIPELINE_BIND_POINT_COMPUTE,
238
device->meta_state.dcc_retile.pipeline);
239
240
struct radv_buffer buffer = {.size = image->size, .bo = image->bo, .offset = image->offset};
241
242
struct radv_buffer_view views[2];
243
VkBufferView view_handles[2];
244
radv_buffer_view_init(views, cmd_buffer->device,
245
&(VkBufferViewCreateInfo){
246
.sType = VK_STRUCTURE_TYPE_BUFFER_VIEW_CREATE_INFO,
247
.buffer = radv_buffer_to_handle(&buffer),
248
.offset = image->planes[0].surface.meta_offset,
249
.range = image->planes[0].surface.meta_size,
250
.format = VK_FORMAT_R8_UINT,
251
});
252
radv_buffer_view_init(views + 1, cmd_buffer->device,
253
&(VkBufferViewCreateInfo){
254
.sType = VK_STRUCTURE_TYPE_BUFFER_VIEW_CREATE_INFO,
255
.buffer = radv_buffer_to_handle(&buffer),
256
.offset = image->planes[0].surface.display_dcc_offset,
257
.range = image->planes[0].surface.u.gfx9.color.display_dcc_size,
258
.format = VK_FORMAT_R8_UINT,
259
});
260
for (unsigned i = 0; i < 2; ++i)
261
view_handles[i] = radv_buffer_view_to_handle(&views[i]);
262
263
radv_meta_push_descriptor_set(cmd_buffer, VK_PIPELINE_BIND_POINT_COMPUTE,
264
device->meta_state.dcc_retile.p_layout, 0, /* set */
265
2, /* descriptorWriteCount */
266
(VkWriteDescriptorSet[]){
267
{
268
.sType = VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,
269
.dstBinding = 0,
270
.dstArrayElement = 0,
271
.descriptorCount = 1,
272
.descriptorType = VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER,
273
.pTexelBufferView = &view_handles[0],
274
},
275
{
276
.sType = VK_STRUCTURE_TYPE_WRITE_DESCRIPTOR_SET,
277
.dstBinding = 1,
278
.dstArrayElement = 0,
279
.descriptorCount = 1,
280
.descriptorType = VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER,
281
.pTexelBufferView = &view_handles[1],
282
},
283
});
284
285
unsigned width = DIV_ROUND_UP(image->info.width, vk_format_get_blockwidth(image->vk_format));
286
unsigned height = DIV_ROUND_UP(image->info.height, vk_format_get_blockheight(image->vk_format));
287
288
unsigned dcc_width = DIV_ROUND_UP(width, image->planes[0].surface.u.gfx9.color.dcc_block_width);
289
unsigned dcc_height =
290
DIV_ROUND_UP(height, image->planes[0].surface.u.gfx9.color.dcc_block_height);
291
292
uint32_t constants[] = {
293
image->planes[0].surface.u.gfx9.color.dcc_pitch_max + 1,
294
image->planes[0].surface.u.gfx9.color.dcc_height,
295
image->planes[0].surface.u.gfx9.color.display_dcc_pitch_max + 1,
296
image->planes[0].surface.u.gfx9.color.display_dcc_height,
297
};
298
radv_CmdPushConstants(radv_cmd_buffer_to_handle(cmd_buffer),
299
device->meta_state.dcc_retile.p_layout, VK_SHADER_STAGE_COMPUTE_BIT, 0, 16,
300
constants);
301
302
radv_unaligned_dispatch(cmd_buffer, dcc_width, dcc_height, 1);
303
304
radv_meta_restore(&saved_state, cmd_buffer);
305
306
state->flush_bits |= RADV_CMD_FLAG_CS_PARTIAL_FLUSH |
307
radv_src_access_flush(cmd_buffer, VK_ACCESS_SHADER_WRITE_BIT, image);
308
}
309
310