Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
PojavLauncherTeam
GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/gallium/drivers/llvmpipe/lp_setup_point.c
4570 views
1
/**************************************************************************
2
*
3
* Copyright 2010, VMware Inc.
4
* All Rights Reserved.
5
*
6
* Permission is hereby granted, free of charge, to any person obtaining a
7
* copy of this software and associated documentation files (the
8
* "Software"), to deal in the Software without restriction, including
9
* without limitation the rights to use, copy, modify, merge, publish,
10
* distribute, sub license, and/or sell copies of the Software, and to
11
* permit persons to whom the Software is furnished to do so, subject to
12
* the following conditions:
13
*
14
* The above copyright notice and this permission notice (including the
15
* next paragraph) shall be included in all copies or substantial portions
16
* of the Software.
17
*
18
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21
* IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22
* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23
* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
*
26
**************************************************************************/
27
28
/*
29
* Binning code for points
30
*/
31
32
#include "util/u_math.h"
33
#include "util/u_memory.h"
34
#include "lp_setup_context.h"
35
#include "lp_perf.h"
36
#include "lp_rast.h"
37
#include "lp_state_fs.h"
38
#include "lp_state_setup.h"
39
#include "lp_context.h"
40
#include "tgsi/tgsi_scan.h"
41
#include "draw/draw_context.h"
42
43
#define NUM_CHANNELS 4
44
45
struct point_info {
46
/* x,y deltas */
47
int dy01, dy12;
48
int dx01, dx12;
49
50
const float (*v0)[4];
51
52
float (*a0)[4];
53
float (*dadx)[4];
54
float (*dady)[4];
55
56
boolean frontfacing;
57
};
58
59
60
/**
61
* Compute a0 for a constant-valued coefficient (GL_FLAT shading).
62
*/
63
static void
64
constant_coef(struct lp_setup_context *setup,
65
struct point_info *info,
66
unsigned slot,
67
const float value,
68
unsigned i)
69
{
70
info->a0[slot][i] = value;
71
info->dadx[slot][i] = 0.0f;
72
info->dady[slot][i] = 0.0f;
73
}
74
75
76
static void
77
point_persp_coeff(struct lp_setup_context *setup,
78
const struct point_info *info,
79
unsigned slot,
80
unsigned i)
81
{
82
/*
83
* Fragment shader expects pre-multiplied w for LP_INTERP_PERSPECTIVE. A
84
* better strategy would be to take the primitive in consideration when
85
* generating the fragment shader key, and therefore avoid the per-fragment
86
* perspective divide.
87
*/
88
89
float w0 = info->v0[0][3];
90
91
assert(i < 4);
92
93
info->a0[slot][i] = info->v0[slot][i]*w0;
94
info->dadx[slot][i] = 0.0f;
95
info->dady[slot][i] = 0.0f;
96
}
97
98
99
/**
100
* Setup automatic texcoord coefficients (for sprite rendering).
101
* \param slot the vertex attribute slot to setup
102
* \param i the attribute channel in [0,3]
103
* \param sprite_coord_origin one of PIPE_SPRITE_COORD_x
104
* \param perspective does the shader expects pre-multiplied w, i.e.,
105
* LP_INTERP_PERSPECTIVE is specified in the shader key
106
*/
107
static void
108
texcoord_coef(struct lp_setup_context *setup,
109
const struct point_info *info,
110
unsigned slot,
111
unsigned i,
112
unsigned sprite_coord_origin,
113
boolean perspective)
114
{
115
float w0 = info->v0[0][3];
116
117
assert(i < 4);
118
119
if (i == 0) {
120
float dadx = FIXED_ONE / (float)info->dx12;
121
float dady = 0.0f;
122
float x0 = info->v0[0][0] - setup->pixel_offset;
123
float y0 = info->v0[0][1] - setup->pixel_offset;
124
125
info->dadx[slot][0] = dadx;
126
info->dady[slot][0] = dady;
127
info->a0[slot][0] = 0.5 - (dadx * x0 + dady * y0);
128
129
if (perspective) {
130
info->dadx[slot][0] *= w0;
131
info->dady[slot][0] *= w0;
132
info->a0[slot][0] *= w0;
133
}
134
}
135
else if (i == 1) {
136
float dadx = 0.0f;
137
float dady = FIXED_ONE / (float)info->dx12;
138
float x0 = info->v0[0][0] - setup->pixel_offset;
139
float y0 = info->v0[0][1] - setup->pixel_offset;
140
141
if (sprite_coord_origin == PIPE_SPRITE_COORD_LOWER_LEFT) {
142
dady = -dady;
143
}
144
145
info->dadx[slot][1] = dadx;
146
info->dady[slot][1] = dady;
147
info->a0[slot][1] = 0.5 - (dadx * x0 + dady * y0);
148
149
if (perspective) {
150
info->dadx[slot][1] *= w0;
151
info->dady[slot][1] *= w0;
152
info->a0[slot][1] *= w0;
153
}
154
}
155
else if (i == 2) {
156
info->a0[slot][2] = 0.0f;
157
info->dadx[slot][2] = 0.0f;
158
info->dady[slot][2] = 0.0f;
159
}
160
else {
161
info->a0[slot][3] = perspective ? w0 : 1.0f;
162
info->dadx[slot][3] = 0.0f;
163
info->dady[slot][3] = 0.0f;
164
}
165
}
166
167
168
/**
169
* Special coefficient setup for gl_FragCoord.
170
* X and Y are trivial
171
* Z and W are copied from position_coef which should have already been computed.
172
* We could do a bit less work if we'd examine gl_FragCoord's swizzle mask.
173
*/
174
static void
175
setup_point_fragcoord_coef(struct lp_setup_context *setup,
176
struct point_info *info,
177
unsigned slot,
178
unsigned usage_mask)
179
{
180
/*X*/
181
if (usage_mask & TGSI_WRITEMASK_X) {
182
info->a0[slot][0] = 0.0;
183
info->dadx[slot][0] = 1.0;
184
info->dady[slot][0] = 0.0;
185
}
186
187
/*Y*/
188
if (usage_mask & TGSI_WRITEMASK_Y) {
189
info->a0[slot][1] = 0.0;
190
info->dadx[slot][1] = 0.0;
191
info->dady[slot][1] = 1.0;
192
}
193
194
/*Z*/
195
if (usage_mask & TGSI_WRITEMASK_Z) {
196
constant_coef(setup, info, slot, info->v0[0][2], 2);
197
}
198
199
/*W*/
200
if (usage_mask & TGSI_WRITEMASK_W) {
201
constant_coef(setup, info, slot, info->v0[0][3], 3);
202
}
203
}
204
205
206
/**
207
* Compute the point->coef[] array dadx, dady, a0 values.
208
*/
209
static void
210
setup_point_coefficients( struct lp_setup_context *setup,
211
struct point_info *info)
212
{
213
const struct lp_setup_variant_key *key = &setup->setup.variant->key;
214
const struct lp_fragment_shader *shader = setup->fs.current.variant->shader;
215
unsigned fragcoord_usage_mask = TGSI_WRITEMASK_XYZ;
216
unsigned slot;
217
218
/* setup interpolation for all the remaining attributes:
219
*/
220
for (slot = 0; slot < key->num_inputs; slot++) {
221
unsigned vert_attr = key->inputs[slot].src_index;
222
unsigned usage_mask = key->inputs[slot].usage_mask;
223
enum lp_interp interp = key->inputs[slot].interp;
224
boolean perspective = !!(interp == LP_INTERP_PERSPECTIVE);
225
unsigned i;
226
227
if (perspective && usage_mask) {
228
fragcoord_usage_mask |= TGSI_WRITEMASK_W;
229
}
230
231
switch (interp) {
232
case LP_INTERP_POSITION:
233
/*
234
* The generated pixel interpolators will pick up the coeffs from
235
* slot 0, so all need to ensure that the usage mask is covers all
236
* usages.
237
*/
238
fragcoord_usage_mask |= usage_mask;
239
break;
240
241
case LP_INTERP_LINEAR:
242
/* Sprite tex coords may use linear interpolation someday */
243
FALLTHROUGH;
244
case LP_INTERP_PERSPECTIVE: {
245
/* check if the sprite coord flag is set for this attribute.
246
* If so, set it up so it up so x and y vary from 0 to 1.
247
*/
248
bool do_texcoord_coef = false;
249
if (shader->info.base.input_semantic_name[slot] == TGSI_SEMANTIC_PCOORD) {
250
do_texcoord_coef = true;
251
}
252
else if (shader->info.base.input_semantic_name[slot] == TGSI_SEMANTIC_TEXCOORD) {
253
unsigned semantic_index = shader->info.base.input_semantic_index[slot];
254
/* Note that sprite_coord enable is a bitfield of
255
* PIPE_MAX_SHADER_OUTPUTS bits.
256
*/
257
if (semantic_index < PIPE_MAX_SHADER_OUTPUTS &&
258
(setup->sprite_coord_enable & (1u << semantic_index))) {
259
do_texcoord_coef = true;
260
}
261
}
262
if (do_texcoord_coef) {
263
for (i = 0; i < NUM_CHANNELS; i++) {
264
if (usage_mask & (1 << i)) {
265
texcoord_coef(setup, info, slot + 1, i,
266
setup->sprite_coord_origin,
267
perspective);
268
}
269
}
270
break;
271
}
272
}
273
FALLTHROUGH;
274
case LP_INTERP_CONSTANT:
275
for (i = 0; i < NUM_CHANNELS; i++) {
276
if (usage_mask & (1 << i)) {
277
if (perspective) {
278
point_persp_coeff(setup, info, slot+1, i);
279
}
280
else {
281
constant_coef(setup, info, slot+1, info->v0[vert_attr][i], i);
282
}
283
}
284
}
285
break;
286
287
case LP_INTERP_FACING:
288
for (i = 0; i < NUM_CHANNELS; i++)
289
if (usage_mask & (1 << i))
290
constant_coef(setup, info, slot+1,
291
info->frontfacing ? 1.0f : -1.0f, i);
292
break;
293
294
default:
295
assert(0);
296
break;
297
}
298
}
299
300
/* The internal position input is in slot zero:
301
*/
302
setup_point_fragcoord_coef(setup, info, 0,
303
fragcoord_usage_mask);
304
}
305
306
307
static inline int
308
subpixel_snap(float a)
309
{
310
return util_iround(FIXED_ONE * a);
311
}
312
313
/**
314
* Print point vertex attribs (for debug).
315
*/
316
static void
317
print_point(struct lp_setup_context *setup,
318
const float (*v0)[4],
319
const float size)
320
{
321
const struct lp_setup_variant_key *key = &setup->setup.variant->key;
322
uint i;
323
324
debug_printf("llvmpipe point, width %f\n", size);
325
for (i = 0; i < 1 + key->num_inputs; i++) {
326
debug_printf(" v0[%d]: %f %f %f %f\n", i,
327
v0[i][0], v0[i][1], v0[i][2], v0[i][3]);
328
}
329
}
330
331
332
static boolean
333
try_setup_point( struct lp_setup_context *setup,
334
const float (*v0)[4] )
335
{
336
struct llvmpipe_context *lp_context = (struct llvmpipe_context *)setup->pipe;
337
/* x/y positions in fixed point */
338
const struct lp_setup_variant_key *key = &setup->setup.variant->key;
339
const int sizeAttr = setup->psize_slot;
340
float size
341
= (setup->point_size_per_vertex && sizeAttr > 0) ? v0[sizeAttr][0]
342
: setup->point_size;
343
344
if (size > LP_MAX_POINT_WIDTH)
345
size = LP_MAX_POINT_WIDTH;
346
347
/* Yes this is necessary to accurately calculate bounding boxes
348
* with the two fill-conventions we support. GL (normally) ends
349
* up needing a bottom-left fill convention, which requires
350
* slightly different rounding.
351
*/
352
int adj = (setup->bottom_edge_rule != 0) ? 1 : 0;
353
float pixel_offset = setup->multisample ? 0.0 : setup->pixel_offset;
354
struct lp_scene *scene = setup->scene;
355
struct lp_rast_triangle *point;
356
unsigned bytes;
357
struct u_rect bbox;
358
int x[2], y[2];
359
unsigned nr_planes = 4;
360
struct point_info info;
361
unsigned viewport_index = 0;
362
unsigned layer = 0;
363
int fixed_width;
364
365
if (setup->viewport_index_slot > 0) {
366
unsigned *udata = (unsigned*)v0[setup->viewport_index_slot];
367
viewport_index = lp_clamp_viewport_idx(*udata);
368
}
369
if (setup->layer_slot > 0) {
370
layer = *(unsigned*)v0[setup->layer_slot];
371
layer = MIN2(layer, scene->fb_max_layer);
372
}
373
374
if (0)
375
print_point(setup, v0, size);
376
377
/* Bounding rectangle (in pixels) */
378
if (!setup->legacy_points || setup->multisample) {
379
/*
380
* Rasterize points as quads.
381
*/
382
int x0, y0;
383
/* Point size as fixed point integer, remove rounding errors
384
* and gives minimum width for very small points.
385
*/
386
fixed_width = MAX2(FIXED_ONE, subpixel_snap(size));
387
388
x0 = subpixel_snap(v0[0][0] - pixel_offset) - fixed_width/2;
389
y0 = subpixel_snap(v0[0][1] - pixel_offset) - fixed_width/2;
390
391
x[0] = x0;
392
x[1] = x0 + fixed_width;
393
y[0] = y0;
394
y[1] = y0 + fixed_width;
395
bbox.x0 = x[0] >> FIXED_ORDER;
396
bbox.x1 = (x[1] + (FIXED_ONE-1)) >> FIXED_ORDER;
397
bbox.y0 = (y[0] + adj) >> FIXED_ORDER;
398
bbox.y1 = (y[1] + (FIXED_ONE-1) + adj) >> FIXED_ORDER;
399
400
/* Inclusive coordinates:
401
*/
402
bbox.x1--;
403
bbox.y1--;
404
} else {
405
/*
406
* OpenGL legacy rasterization rules for non-sprite points.
407
*
408
* Per OpenGL 2.1 spec, section 3.3.1, "Basic Point Rasterization".
409
*
410
* This type of point rasterization is only available in pre 3.0 contexts
411
* (or compatibility contexts which we don't support) anyway.
412
*/
413
414
const int x0 = subpixel_snap(v0[0][0]);
415
const int y0 = subpixel_snap(v0[0][1]) - adj;
416
417
int int_width;
418
/* Point size as fixed point integer. For GL legacy points
419
* the point size is always a whole integer.
420
*/
421
fixed_width = MAX2(FIXED_ONE,
422
(subpixel_snap(size) + FIXED_ONE/2 - 1) & ~(FIXED_ONE-1));
423
int_width = fixed_width >> FIXED_ORDER;
424
425
assert(setup->pixel_offset != 0);
426
427
if (int_width == 1) {
428
bbox.x0 = x0 >> FIXED_ORDER;
429
bbox.y0 = y0 >> FIXED_ORDER;
430
bbox.x1 = bbox.x0;
431
bbox.y1 = bbox.y0;
432
} else {
433
if (int_width & 1) {
434
/* Odd width */
435
bbox.x0 = (x0 >> FIXED_ORDER) - (int_width - 1)/2;
436
bbox.y0 = (y0 >> FIXED_ORDER) - (int_width - 1)/2;
437
} else {
438
/* Even width */
439
bbox.x0 = ((x0 + FIXED_ONE/2) >> FIXED_ORDER) - int_width/2;
440
bbox.y0 = ((y0 + FIXED_ONE/2) >> FIXED_ORDER) - int_width/2;
441
}
442
443
bbox.x1 = bbox.x0 + int_width - 1;
444
bbox.y1 = bbox.y0 + int_width - 1;
445
}
446
447
x[0] = (bbox.x0 - 1) << 8;
448
x[1] = (bbox.x1 + 1) << 8;
449
y[0] = (bbox.y0 - 1) << 8;
450
y[1] = (bbox.y1 + 1) << 8;
451
}
452
453
if (0) {
454
debug_printf(" bbox: (%i, %i) - (%i, %i)\n",
455
bbox.x0, bbox.y0,
456
bbox.x1, bbox.y1);
457
}
458
459
if (lp_context->active_statistics_queries) {
460
lp_context->pipeline_statistics.c_primitives++;
461
}
462
463
if (!u_rect_test_intersection(&setup->draw_regions[viewport_index], &bbox)) {
464
if (0) debug_printf("offscreen\n");
465
LP_COUNT(nr_culled_tris);
466
return TRUE;
467
}
468
469
u_rect_find_intersection(&setup->draw_regions[viewport_index], &bbox);
470
471
point = lp_setup_alloc_triangle(scene,
472
key->num_inputs,
473
nr_planes,
474
&bytes);
475
if (!point)
476
return FALSE;
477
478
#ifdef DEBUG
479
point->v[0][0] = v0[0][0];
480
point->v[0][1] = v0[0][1];
481
#endif
482
483
LP_COUNT(nr_tris);
484
485
if (draw_will_inject_frontface(lp_context->draw) &&
486
setup->face_slot > 0) {
487
point->inputs.frontfacing = v0[setup->face_slot][0];
488
} else {
489
point->inputs.frontfacing = TRUE;
490
}
491
492
info.v0 = v0;
493
info.dx01 = 0;
494
info.dx12 = fixed_width;
495
info.dy01 = fixed_width;
496
info.dy12 = 0;
497
info.a0 = GET_A0(&point->inputs);
498
info.dadx = GET_DADX(&point->inputs);
499
info.dady = GET_DADY(&point->inputs);
500
info.frontfacing = point->inputs.frontfacing;
501
502
/* Setup parameter interpolants:
503
*/
504
setup_point_coefficients(setup, &info);
505
506
point->inputs.disable = FALSE;
507
point->inputs.opaque = FALSE;
508
point->inputs.layer = layer;
509
point->inputs.viewport_index = viewport_index;
510
point->inputs.view_index = setup->view_index;
511
512
{
513
struct lp_rast_plane *plane = GET_PLANES(point);
514
515
plane[0].dcdx = ~0U << 8;
516
plane[0].dcdy = 0;
517
plane[0].c = -x[0];
518
plane[0].eo = 1 << 8;
519
520
plane[1].dcdx = 1 << 8;
521
plane[1].dcdy = 0;
522
plane[1].c = x[1];
523
plane[1].eo = 0;
524
525
plane[2].dcdx = 0;
526
plane[2].dcdy = 1 << 8;
527
plane[2].c = -y[0];
528
plane[2].eo = 1 << 8;
529
530
plane[3].dcdx = 0;
531
plane[3].dcdy = ~0U << 8;
532
plane[3].c = y[1];
533
plane[3].eo = 0;
534
535
if (!setup->legacy_points || setup->multisample) {
536
/* adjust for fill-rule*/
537
plane[0].c++; /* left */
538
if (setup->bottom_edge_rule == 0)
539
plane[2].c++; /* top-left */
540
else
541
plane[3].c++; /* bottom-left */
542
}
543
}
544
545
return lp_setup_bin_triangle(setup, point, &bbox, &bbox, nr_planes, viewport_index);
546
}
547
548
549
static void
550
lp_setup_point_discard(struct lp_setup_context *setup,
551
const float (*v0)[4])
552
{
553
}
554
555
static void
556
lp_setup_point(struct lp_setup_context *setup,
557
const float (*v0)[4])
558
{
559
if (!try_setup_point(setup, v0)) {
560
if (!lp_setup_flush_and_restart(setup))
561
return;
562
563
if (!try_setup_point(setup, v0))
564
return;
565
}
566
}
567
568
569
void
570
lp_setup_choose_point(struct lp_setup_context *setup)
571
{
572
if (setup->rasterizer_discard) {
573
setup->point = lp_setup_point_discard;
574
} else {
575
setup->point = lp_setup_point;
576
}
577
}
578
579
580
581