CoCalc -- svga_pipe

GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/gallium/drivers/svga/svga_pipe_query.c
⁴⁵⁷⁰ views
1
/**********************************************************
2
 * Copyright 2008-2015 VMware, Inc.  All rights reserved.
3
 *
4
 * Permission is hereby granted, free of charge, to any person
5
 * obtaining a copy of this software and associated documentation
6
 * files (the "Software"), to deal in the Software without
7
 * restriction, including without limitation the rights to use, copy,
8
 * modify, merge, publish, distribute, sublicense, and/or sell copies
9
 * of the Software, and to permit persons to whom the Software is
10
 * furnished to do so, subject to the following conditions:
11
 *
12
 * The above copyright notice and this permission notice shall be
13
 * included in all copies or substantial portions of the Software.
14
 *
15
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22
 * SOFTWARE.
23
 *
24
 **********************************************************/
25

26
#include "pipe/p_state.h"
27
#include "pipe/p_context.h"
28

29
#include "util/u_bitmask.h"
30
#include "util/u_memory.h"
31

32
#include "svga_cmd.h"
33
#include "svga_context.h"
34
#include "svga_screen.h"
35
#include "svga_resource_buffer.h"
36
#include "svga_winsys.h"
37
#include "svga_debug.h"
38

39

40
/*
 * FIXME: there should be a public base class shared by all pipe structs,
 * even if it would hold very little.  Until then this placeholder gives
 * the driver's query object something to embed.
 */
struct pipe_query
{
   int dummy;
};
46

47
struct svga_query {
48
   struct pipe_query base;
49
   unsigned type;                  /**< PIPE_QUERY_x or SVGA_QUERY_x */
50
   SVGA3dQueryType svga_type;      /**< SVGA3D_QUERYTYPE_x or unused */
51

52
   unsigned id;                    /** Per-context query identifier */
53
   boolean active;                 /** TRUE if query is active */
54

55
   struct pipe_fence_handle *fence;
56

57
   /** For PIPE_QUERY_OCCLUSION_COUNTER / SVGA3D_QUERYTYPE_OCCLUSION */
58

59
   /* For VGPU9 */
60
   struct svga_winsys_buffer *hwbuf;
61
   volatile SVGA3dQueryResult *queryResult;
62

63
   /** For VGPU10 */
64
   struct svga_winsys_gb_query *gb_query;
65
   SVGA3dDXQueryFlags flags;
66
   unsigned offset;                /**< offset to the gb_query memory */
67
   struct pipe_query *predicate;   /** The associated query that can be used for predicate */
68

69
   /** For non-GPU SVGA_QUERY_x queries */
70
   uint64_t begin_count, end_count;
71
};
72

73

74
/**
 * Downcast a generic pipe_query pointer to the driver's svga_query.
 * No checking is performed; the pointer is simply reinterpreted.
 */
static inline struct svga_query *
svga_query(struct pipe_query *q)
{
   struct svga_query *sq = (struct svga_query *)q;

   return sq;
}
80

81
/**
82
 * VGPU9
83
 */
84

85
/* Forward declaration: begin_query_vgpu9() calls this before it is defined. */
static bool
svga_get_query_result(struct pipe_context *pipe, struct pipe_query *q,
                      bool wait, union pipe_query_result *result);
90

91
static enum pipe_error
92
define_query_vgpu9(struct svga_context *svga,
93
                   struct svga_query *sq)
94
{
95
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
96

97
   sq->hwbuf = svga_winsys_buffer_create(svga, 1,
98
                                         SVGA_BUFFER_USAGE_PINNED,
99
                                         sizeof *sq->queryResult);
100
   if (!sq->hwbuf)
101
      return PIPE_ERROR_OUT_OF_MEMORY;
102

103
   sq->queryResult = (SVGA3dQueryResult *)
104
                     sws->buffer_map(sws, sq->hwbuf, PIPE_MAP_WRITE);
105
   if (!sq->queryResult) {
106
      sws->buffer_destroy(sws, sq->hwbuf);
107
      return PIPE_ERROR_OUT_OF_MEMORY;
108
   }
109

110
   sq->queryResult->totalSize = sizeof *sq->queryResult;
111
   sq->queryResult->state = SVGA3D_QUERYSTATE_NEW;
112

113
   /* We request the buffer to be pinned and assume it is always mapped.
114
    * The reason is that we don't want to wait for fences when checking the
115
    * query status.
116
    */
117
   sws->buffer_unmap(sws, sq->hwbuf);
118

119
   return PIPE_OK;
120
}
121

122
static void
123
begin_query_vgpu9(struct svga_context *svga, struct svga_query *sq)
124
{
125
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
126

127
   if (sq->queryResult->state == SVGA3D_QUERYSTATE_PENDING) {
128
      /* The application doesn't care for the pending query result.
129
       * We cannot let go of the existing buffer and just get a new one
130
       * because its storage may be reused for other purposes and clobbered
131
       * by the host when it determines the query result.  So the only
132
       * option here is to wait for the existing query's result -- not a
133
       * big deal, given that no sane application would do this.
134
       */
135
       uint64_t result;
136
       svga_get_query_result(&svga->pipe, &sq->base, TRUE, (void*)&result);
137
       assert(sq->queryResult->state != SVGA3D_QUERYSTATE_PENDING);
138
   }
139

140
   sq->queryResult->state = SVGA3D_QUERYSTATE_NEW;
141
   sws->fence_reference(sws, &sq->fence, NULL);
142

143
   SVGA_RETRY(svga, SVGA3D_BeginQuery(svga->swc, sq->svga_type));
144
}
145

146
static void
147
end_query_vgpu9(struct svga_context *svga, struct svga_query *sq)
148
{
149
   /* Set to PENDING before sending EndQuery. */
150
   sq->queryResult->state = SVGA3D_QUERYSTATE_PENDING;
151

152
   SVGA_RETRY(svga, SVGA3D_EndQuery(svga->swc, sq->svga_type, sq->hwbuf));
153
}
154

155
static bool
156
get_query_result_vgpu9(struct svga_context *svga, struct svga_query *sq,
157
                       bool wait, uint64_t *result)
158
{
159
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
160
   SVGA3dQueryState state;
161

162
   if (!sq->fence) {
163
      /* The query status won't be updated by the host unless
164
       * SVGA_3D_CMD_WAIT_FOR_QUERY is emitted. Unfortunately this will cause
165
       * a synchronous wait on the host.
166
       */
167
      SVGA_RETRY(svga, SVGA3D_WaitForQuery(svga->swc, sq->svga_type,
168
                                           sq->hwbuf));
169
      svga_context_flush(svga, &sq->fence);
170
      assert(sq->fence);
171
   }
172

173
   state = sq->queryResult->state;
174
   if (state == SVGA3D_QUERYSTATE_PENDING) {
175
      if (!wait)
176
         return false;
177
      sws->fence_finish(sws, sq->fence, PIPE_TIMEOUT_INFINITE,
178
                        SVGA_FENCE_FLAG_QUERY);
179
      state = sq->queryResult->state;
180
   }
181

182
   assert(state == SVGA3D_QUERYSTATE_SUCCEEDED ||
183
          state == SVGA3D_QUERYSTATE_FAILED);
184

185
   *result = (uint64_t)sq->queryResult->result32;
186
   return true;
187
}
188

189

190
/**
191
 * VGPU10
192
 *
193
 * There is one query mob allocated for each context to be shared by all
194
 * query types. The mob is used to hold queries' state and result. Since
195
 * each query result type is of different length, to ease the query allocation
196
 * management, the mob is divided into memory blocks. Each memory block
197
 * will hold queries of the same type. Multiple memory blocks can be allocated
198
 * for a particular query type.
199
 *
200
 * Currently each memory block is of 184 bytes. We support up to 512
201
 * memory blocks. The query memory size is arbitrary right now.
202
 * Each occlusion query takes about 8 bytes. One memory block can accommodate
203
 * 23 occlusion queries. 512 of those blocks can support up to 11K occlusion
204
 * queries. That seems reasonable for now. If we think this limit is
205
 * not enough, we can increase the limit or try to grow the mob in runtime.
206
 * Note, SVGA device does not impose one mob per context for queries,
207
 * we could allocate multiple mobs for queries; however, wddm KMD does not
208
 * currently support that.
209
 *
210
 * Also note that the GL guest driver does not issue any of the
211
 * following commands: DXMoveQuery, DXBindAllQuery & DXReadbackAllQuery.
212
 */
213
/* Size in bytes of one query memory block: two query result unions. */
#define SVGA_QUERY_MEM_BLOCK_SIZE    (2 * sizeof(SVGADXQueryResultUnion))
/* Size in bytes of the whole query memory object: 512 memory blocks. */
#define SVGA_QUERY_MEM_SIZE          (SVGA_QUERY_MEM_BLOCK_SIZE * 512)
215

216
/**
 * Bookkeeping for one memory block of the query memory object.
 * Entries of the same query type are chained through \c next.
 */
struct svga_qmem_alloc_entry {
   unsigned start_offset;               /* byte offset where the block starts */
   unsigned block_index;                /* index of the block in the query memory */
   unsigned query_size;                 /* size of each query slot in the block */
   unsigned nquery;                     /* number of slots currently allocated */
   struct util_bitmask *alloc_mask;     /* which slots are in use */
   struct svga_qmem_alloc_entry *next;  /* next block in the chain */
};
225

226

227
/**
228
 * Allocate a memory block from the query object memory
229
 * \return NULL if out of memory, else pointer to the query memory block
230
 */
231
static struct svga_qmem_alloc_entry *
232
allocate_query_block(struct svga_context *svga)
233
{
234
   int index;
235
   unsigned offset;
236
   struct svga_qmem_alloc_entry *alloc_entry = NULL;
237

238
   /* Find the next available query block */
239
   index = util_bitmask_add(svga->gb_query_alloc_mask);
240

241
   if (index == UTIL_BITMASK_INVALID_INDEX)
242
      return NULL;
243

244
   offset = index * SVGA_QUERY_MEM_BLOCK_SIZE;
245
   if (offset >= svga->gb_query_len) {
246
      unsigned i;
247

248
      /* Deallocate the out-of-range index */
249
      util_bitmask_clear(svga->gb_query_alloc_mask, index);
250
      index = -1;
251

252
      /**
253
       * All the memory blocks are allocated, lets see if there is
254
       * any empty memory block around that can be freed up.
255
       */
256
      for (i = 0; i < SVGA3D_QUERYTYPE_MAX && index == -1; i++) {
257
         struct svga_qmem_alloc_entry *prev_alloc_entry = NULL;
258

259
         alloc_entry = svga->gb_query_map[i];
260
         while (alloc_entry && index == -1) {
261
            if (alloc_entry->nquery == 0) {
262
               /* This memory block is empty, it can be recycled. */
263
               if (prev_alloc_entry) {
264
                  prev_alloc_entry->next = alloc_entry->next;
265
               } else {
266
                  svga->gb_query_map[i] = alloc_entry->next;
267
               }
268
               index = alloc_entry->block_index;
269
            } else {
270
               prev_alloc_entry = alloc_entry;
271
               alloc_entry = alloc_entry->next;
272
            }
273
         }
274
      }
275

276
      if (index == -1) {
277
         debug_printf("Query memory object is full\n");
278
         return NULL;
279
      }
280
   }
281

282
   if (!alloc_entry) {
283
      assert(index != -1);
284
      alloc_entry = CALLOC_STRUCT(svga_qmem_alloc_entry);
285
      alloc_entry->block_index = index;
286
   }
287

288
   return alloc_entry;
289
}
290

291
/**
292
 * Allocate a slot in the specified memory block.
293
 * All slots in this memory block are of the same size.
294
 *
295
 * \return -1 if out of memory, else index of the query slot
296
 */
297
static int
298
allocate_query_slot(struct svga_context *svga,
299
                    struct svga_qmem_alloc_entry *alloc)
300
{
301
   int index;
302
   unsigned offset;
303

304
   /* Find the next available slot */
305
   index = util_bitmask_add(alloc->alloc_mask);
306

307
   if (index == UTIL_BITMASK_INVALID_INDEX)
308
      return -1;
309

310
   offset = index * alloc->query_size;
311
   if (offset >= SVGA_QUERY_MEM_BLOCK_SIZE)
312
      return -1;
313

314
   alloc->nquery++;
315

316
   return index;
317
}
318

319
/**
320
 * Deallocate the specified slot in the memory block.
321
 * If all slots are freed up, then deallocate the memory block
322
 * as well, so it can be allocated for other query type
323
 */
324
static void
325
deallocate_query_slot(struct svga_context *svga,
326
                      struct svga_qmem_alloc_entry *alloc,
327
                      unsigned index)
328
{
329
   assert(index != UTIL_BITMASK_INVALID_INDEX);
330

331
   util_bitmask_clear(alloc->alloc_mask, index);
332
   alloc->nquery--;
333

334
   /**
335
    * Don't worry about deallocating the empty memory block here.
336
    * The empty memory block will be recycled when no more memory block
337
    * can be allocated.
338
    */
339
}
340

341
static struct svga_qmem_alloc_entry *
342
allocate_query_block_entry(struct svga_context *svga,
343
                           unsigned len)
344
{
345
   struct svga_qmem_alloc_entry *alloc_entry;
346

347
   alloc_entry = allocate_query_block(svga);
348
   if (!alloc_entry)
349
      return NULL;
350

351
   assert(alloc_entry->block_index != -1);
352
   alloc_entry->start_offset =
353
      alloc_entry->block_index * SVGA_QUERY_MEM_BLOCK_SIZE;
354
   alloc_entry->nquery = 0;
355
   alloc_entry->alloc_mask = util_bitmask_create();
356
   alloc_entry->next = NULL;
357
   alloc_entry->query_size = len;
358

359
   return alloc_entry;
360
}
361

362
/**
363
 * Allocate a memory slot for a query of the specified type.
364
 * It will first search through the memory blocks that are allocated
365
 * for the query type. If no memory slot is available, it will try
366
 * to allocate another memory block within the query object memory for
367
 * this query type.
368
 */
369
static int
370
allocate_query(struct svga_context *svga,
371
               SVGA3dQueryType type,
372
               unsigned len)
373
{
374
   struct svga_qmem_alloc_entry *alloc_entry;
375
   int slot_index = -1;
376
   unsigned offset;
377

378
   assert(type < SVGA3D_QUERYTYPE_MAX);
379

380
   alloc_entry = svga->gb_query_map[type];
381

382
   if (!alloc_entry) {
383
      /**
384
       * No query memory block has been allocated for this query type,
385
       * allocate one now
386
       */
387
      alloc_entry = allocate_query_block_entry(svga, len);
388
      if (!alloc_entry)
389
         return -1;
390
      svga->gb_query_map[type] = alloc_entry;
391
   }
392

393
   /* Allocate a slot within the memory block allocated for this query type */
394
   slot_index = allocate_query_slot(svga, alloc_entry);
395

396
   if (slot_index == -1) {
397
      /* This query memory block is full, allocate another one */
398
      alloc_entry = allocate_query_block_entry(svga, len);
399
      if (!alloc_entry)
400
         return -1;
401
      alloc_entry->next = svga->gb_query_map[type];
402
      svga->gb_query_map[type] = alloc_entry;
403
      slot_index = allocate_query_slot(svga, alloc_entry);
404
   }
405

406
   assert(slot_index != -1);
407
   offset = slot_index * len + alloc_entry->start_offset;
408

409
   return offset;
410
}
411

412

413
/**
414
 * Deallocate memory slot allocated for the specified query
415
 */
416
static void
417
deallocate_query(struct svga_context *svga,
418
                 struct svga_query *sq)
419
{
420
   struct svga_qmem_alloc_entry *alloc_entry;
421
   unsigned slot_index;
422
   unsigned offset = sq->offset;
423

424
   alloc_entry = svga->gb_query_map[sq->svga_type];
425

426
   while (alloc_entry) {
427
      if (offset >= alloc_entry->start_offset &&
428
          offset < alloc_entry->start_offset + SVGA_QUERY_MEM_BLOCK_SIZE) {
429

430
         /* The slot belongs to this memory block, deallocate it */
431
         slot_index = (offset - alloc_entry->start_offset) /
432
                      alloc_entry->query_size;
433
         deallocate_query_slot(svga, alloc_entry, slot_index);
434
         alloc_entry = NULL;
435
      } else {
436
         alloc_entry = alloc_entry->next;
437
      }
438
   }
439
}
440

441

442
/**
443
 * Destroy the gb query object and all the related query structures
444
 */
445
static void
446
destroy_gb_query_obj(struct svga_context *svga)
447
{
448
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
449
   unsigned i;
450

451
   for (i = 0; i < SVGA3D_QUERYTYPE_MAX; i++) {
452
      struct svga_qmem_alloc_entry *alloc_entry, *next;
453
      alloc_entry = svga->gb_query_map[i];
454
      while (alloc_entry) {
455
         next = alloc_entry->next;
456
         util_bitmask_destroy(alloc_entry->alloc_mask);
457
         FREE(alloc_entry);
458
         alloc_entry = next;
459
      }
460
      svga->gb_query_map[i] = NULL;
461
   }
462

463
   if (svga->gb_query)
464
      sws->query_destroy(sws, svga->gb_query);
465
   svga->gb_query = NULL;
466

467
   util_bitmask_destroy(svga->gb_query_alloc_mask);
468
}
469

470
/**
471
 * Define query and create the gb query object if it is not already created.
472
 * There is only one gb query object per context which will be shared by
473
 * queries of all types.
474
 */
475
static enum pipe_error
476
define_query_vgpu10(struct svga_context *svga,
477
                    struct svga_query *sq, int resultLen)
478
{
479
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
480
   int qlen;
481
   enum pipe_error ret = PIPE_OK;
482

483
   SVGA_DBG(DEBUG_QUERY, "%s\n", __FUNCTION__);
484

485
   if (svga->gb_query == NULL) {
486
      /* Create a gb query object */
487
      svga->gb_query = sws->query_create(sws, SVGA_QUERY_MEM_SIZE);
488
      if (!svga->gb_query)
489
         return PIPE_ERROR_OUT_OF_MEMORY;
490
      svga->gb_query_len = SVGA_QUERY_MEM_SIZE;
491
      memset (svga->gb_query_map, 0, sizeof(svga->gb_query_map));
492
      svga->gb_query_alloc_mask = util_bitmask_create();
493

494
      /* Bind the query object to the context */
495
      SVGA_RETRY(svga, svga->swc->query_bind(svga->swc, svga->gb_query,
496
                                             SVGA_QUERY_FLAG_SET));
497
   }
498

499
   sq->gb_query = svga->gb_query;
500

501
   /* Make sure query length is in multiples of 8 bytes */
502
   qlen = align(resultLen + sizeof(SVGA3dQueryState), 8);
503

504
   /* Find a slot for this query in the gb object */
505
   sq->offset = allocate_query(svga, sq->svga_type, qlen);
506
   if (sq->offset == -1)
507
      return PIPE_ERROR_OUT_OF_MEMORY;
508

509
   assert((sq->offset & 7) == 0);
510

511
   SVGA_DBG(DEBUG_QUERY, "   query type=%d qid=0x%x offset=%d\n",
512
            sq->svga_type, sq->id, sq->offset);
513

514
   /**
515
    * Send SVGA3D commands to define the query
516
    */
517
   SVGA_RETRY_OOM(svga, ret, SVGA3D_vgpu10_DefineQuery(svga->swc, sq->id,
518
                                                       sq->svga_type,
519
                                                       sq->flags));
520
   if (ret != PIPE_OK)
521
      return PIPE_ERROR_OUT_OF_MEMORY;
522

523
   SVGA_RETRY(svga, SVGA3D_vgpu10_BindQuery(svga->swc, sq->gb_query, sq->id));
524
   SVGA_RETRY(svga, SVGA3D_vgpu10_SetQueryOffset(svga->swc, sq->id,
525
                                                 sq->offset));
526

527
   return PIPE_OK;
528
}
529

530
static void
531
destroy_query_vgpu10(struct svga_context *svga, struct svga_query *sq)
532
{
533
   SVGA_RETRY(svga, SVGA3D_vgpu10_DestroyQuery(svga->swc, sq->id));
534

535
   /* Deallocate the memory slot allocated for this query */
536
   deallocate_query(svga, sq);
537
}
538

539

540
/**
541
 * Rebind queryies to the context.
542
 */
543
static void
544
rebind_vgpu10_query(struct svga_context *svga)
545
{
546
   SVGA_RETRY(svga, svga->swc->query_bind(svga->swc, svga->gb_query,
547
                                          SVGA_QUERY_FLAG_REF));
548
   svga->rebind.flags.query = FALSE;
549
}
550

551

552
static enum pipe_error
553
begin_query_vgpu10(struct svga_context *svga, struct svga_query *sq)
554
{
555
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
556
   int status = 0;
557

558
   sws->fence_reference(sws, &sq->fence, NULL);
559

560
   /* Initialize the query state to NEW */
561
   status = sws->query_init(sws, sq->gb_query, sq->offset, SVGA3D_QUERYSTATE_NEW);
562
   if (status)
563
      return PIPE_ERROR;
564

565
   if (svga->rebind.flags.query) {
566
      rebind_vgpu10_query(svga);
567
   }
568

569
   /* Send the BeginQuery command to the device */
570
   SVGA_RETRY(svga, SVGA3D_vgpu10_BeginQuery(svga->swc, sq->id));
571
   return PIPE_OK;
572
}
573

574
static void
575
end_query_vgpu10(struct svga_context *svga, struct svga_query *sq)
576
{
577
   if (svga->rebind.flags.query) {
578
      rebind_vgpu10_query(svga);
579
   }
580

581
   SVGA_RETRY(svga, SVGA3D_vgpu10_EndQuery(svga->swc, sq->id));
582
}
583

584
static bool
585
get_query_result_vgpu10(struct svga_context *svga, struct svga_query *sq,
586
                        bool wait, void *result, int resultLen)
587
{
588
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
589
   SVGA3dQueryState queryState;
590

591
   if (svga->rebind.flags.query) {
592
      rebind_vgpu10_query(svga);
593
   }
594

595
   sws->query_get_result(sws, sq->gb_query, sq->offset, &queryState, result, resultLen);
596

597
   if (queryState != SVGA3D_QUERYSTATE_SUCCEEDED && !sq->fence) {
598
      /* We don't have the query result yet, and the query hasn't been
599
       * submitted.  We need to submit it now since the GL spec says
600
       * "Querying the state for a given occlusion query forces that
601
       * occlusion query to complete within a finite amount of time."
602
       */
603
      svga_context_flush(svga, &sq->fence);
604
   }
605

606
   if (queryState == SVGA3D_QUERYSTATE_PENDING ||
607
       queryState == SVGA3D_QUERYSTATE_NEW) {
608
      if (!wait)
609
         return false;
610
      sws->fence_finish(sws, sq->fence, PIPE_TIMEOUT_INFINITE,
611
                        SVGA_FENCE_FLAG_QUERY);
612
      sws->query_get_result(sws, sq->gb_query, sq->offset, &queryState, result, resultLen);
613
   }
614

615
   assert(queryState == SVGA3D_QUERYSTATE_SUCCEEDED ||
616
          queryState == SVGA3D_QUERYSTATE_FAILED);
617

618
   return true;
619
}
620

621
static struct pipe_query *
622
svga_create_query(struct pipe_context *pipe,
623
                  unsigned query_type,
624
                  unsigned index)
625
{
626
   struct svga_context *svga = svga_context(pipe);
627
   struct svga_query *sq;
628
   enum pipe_error ret;
629

630
   assert(query_type < SVGA_QUERY_MAX);
631

632
   sq = CALLOC_STRUCT(svga_query);
633
   if (!sq)
634
      goto fail;
635

636
   /* Allocate an integer ID for the query */
637
   sq->id = util_bitmask_add(svga->query_id_bm);
638
   if (sq->id == UTIL_BITMASK_INVALID_INDEX)
639
      goto fail;
640

641
   SVGA_DBG(DEBUG_QUERY, "%s type=%d sq=0x%x id=%d\n", __FUNCTION__,
642
            query_type, sq, sq->id);
643

644
   switch (query_type) {
645
   case PIPE_QUERY_OCCLUSION_COUNTER:
646
      sq->svga_type = SVGA3D_QUERYTYPE_OCCLUSION;
647
      if (svga_have_vgpu10(svga)) {
648
         ret = define_query_vgpu10(svga, sq,
649
                                   sizeof(SVGADXOcclusionQueryResult));
650
         if (ret != PIPE_OK)
651
            goto fail;
652

653
         /**
654
          * In OpenGL, occlusion counter query can be used in conditional
655
          * rendering; however, in DX10, only OCCLUSION_PREDICATE query can
656
          * be used for predication. Hence, we need to create an occlusion
657
          * predicate query along with the occlusion counter query. So when
658
          * the occlusion counter query is used for predication, the associated
659
          * query of occlusion predicate type will be used
660
          * in the SetPredication command.
661
          */
662
         sq->predicate = svga_create_query(pipe, PIPE_QUERY_OCCLUSION_PREDICATE, index);
663

664
      } else {
665
         ret = define_query_vgpu9(svga, sq);
666
         if (ret != PIPE_OK)
667
            goto fail;
668
      }
669
      break;
670
   case PIPE_QUERY_OCCLUSION_PREDICATE:
671
   case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
672
      if (svga_have_vgpu10(svga)) {
673
         sq->svga_type = SVGA3D_QUERYTYPE_OCCLUSIONPREDICATE;
674
         ret = define_query_vgpu10(svga, sq,
675
                                   sizeof(SVGADXOcclusionPredicateQueryResult));
676
         if (ret != PIPE_OK)
677
            goto fail;
678
      } else {
679
         sq->svga_type = SVGA3D_QUERYTYPE_OCCLUSION;
680
         ret = define_query_vgpu9(svga, sq);
681
         if (ret != PIPE_OK)
682
            goto fail;
683
      }
684
      break;
685
   case PIPE_QUERY_PRIMITIVES_GENERATED:
686
   case PIPE_QUERY_PRIMITIVES_EMITTED:
687
   case PIPE_QUERY_SO_STATISTICS:
688
      assert(svga_have_vgpu10(svga));
689

690
      /* Until the device supports the new query type for multiple streams,
691
       * we will use the single stream query type for stream 0.
692
       */
693
      if (svga_have_sm5(svga) && index > 0) {
694
         assert(index < 4);
695

696
         sq->svga_type = SVGA3D_QUERYTYPE_SOSTATS_STREAM0 + index;
697
      }
698
      else {
699
         assert(index == 0);
700
         sq->svga_type = SVGA3D_QUERYTYPE_STREAMOUTPUTSTATS;
701
      }
702
      ret = define_query_vgpu10(svga, sq,
703
                                sizeof(SVGADXStreamOutStatisticsQueryResult));
704
      if (ret != PIPE_OK)
705
         goto fail;
706
      break;
707
   case PIPE_QUERY_TIMESTAMP:
708
      assert(svga_have_vgpu10(svga));
709
      sq->svga_type = SVGA3D_QUERYTYPE_TIMESTAMP;
710
      ret = define_query_vgpu10(svga, sq,
711
                                sizeof(SVGADXTimestampQueryResult));
712
      if (ret != PIPE_OK)
713
         goto fail;
714
      break;
715
   case SVGA_QUERY_NUM_DRAW_CALLS:
716
   case SVGA_QUERY_NUM_FALLBACKS:
717
   case SVGA_QUERY_NUM_FLUSHES:
718
   case SVGA_QUERY_NUM_VALIDATIONS:
719
   case SVGA_QUERY_NUM_BUFFERS_MAPPED:
720
   case SVGA_QUERY_NUM_TEXTURES_MAPPED:
721
   case SVGA_QUERY_NUM_BYTES_UPLOADED:
722
   case SVGA_QUERY_NUM_COMMAND_BUFFERS:
723
   case SVGA_QUERY_COMMAND_BUFFER_SIZE:
724
   case SVGA_QUERY_SURFACE_WRITE_FLUSHES:
725
   case SVGA_QUERY_MEMORY_USED:
726
   case SVGA_QUERY_NUM_SHADERS:
727
   case SVGA_QUERY_NUM_RESOURCES:
728
   case SVGA_QUERY_NUM_STATE_OBJECTS:
729
   case SVGA_QUERY_NUM_SURFACE_VIEWS:
730
   case SVGA_QUERY_NUM_GENERATE_MIPMAP:
731
   case SVGA_QUERY_NUM_READBACKS:
732
   case SVGA_QUERY_NUM_RESOURCE_UPDATES:
733
   case SVGA_QUERY_NUM_BUFFER_UPLOADS:
734
   case SVGA_QUERY_NUM_CONST_BUF_UPDATES:
735
   case SVGA_QUERY_NUM_CONST_UPDATES:
736
   case SVGA_QUERY_NUM_FAILED_ALLOCATIONS:
737
   case SVGA_QUERY_NUM_COMMANDS_PER_DRAW:
738
   case SVGA_QUERY_NUM_SHADER_RELOCATIONS:
739
   case SVGA_QUERY_NUM_SURFACE_RELOCATIONS:
740
   case SVGA_QUERY_SHADER_MEM_USED:
741
      break;
742
   case SVGA_QUERY_FLUSH_TIME:
743
   case SVGA_QUERY_MAP_BUFFER_TIME:
744
      /* These queries need os_time_get() */
745
      svga->hud.uses_time = TRUE;
746
      break;
747

748
   default:
749
      assert(!"unexpected query type in svga_create_query()");
750
   }
751

752
   sq->type = query_type;
753

754
   return &sq->base;
755

756
fail:
757
   FREE(sq);
758
   return NULL;
759
}
760

761
static void
762
svga_destroy_query(struct pipe_context *pipe, struct pipe_query *q)
763
{
764
   struct svga_context *svga = svga_context(pipe);
765
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
766
   struct svga_query *sq;
767

768
   if (!q) {
769
      destroy_gb_query_obj(svga);
770
      return;
771
   }
772

773
   sq = svga_query(q);
774

775
   SVGA_DBG(DEBUG_QUERY, "%s sq=0x%x id=%d\n", __FUNCTION__,
776
            sq, sq->id);
777

778
   switch (sq->type) {
779
   case PIPE_QUERY_OCCLUSION_COUNTER:
780
   case PIPE_QUERY_OCCLUSION_PREDICATE:
781
   case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
782
      if (svga_have_vgpu10(svga)) {
783
         /* make sure to also destroy any associated predicate query */
784
         if (sq->predicate)
785
            svga_destroy_query(pipe, sq->predicate);
786
         destroy_query_vgpu10(svga, sq);
787
      } else {
788
         sws->buffer_destroy(sws, sq->hwbuf);
789
      }
790
      sws->fence_reference(sws, &sq->fence, NULL);
791
      break;
792
   case PIPE_QUERY_PRIMITIVES_GENERATED:
793
   case PIPE_QUERY_PRIMITIVES_EMITTED:
794
   case PIPE_QUERY_SO_STATISTICS:
795
   case PIPE_QUERY_TIMESTAMP:
796
      assert(svga_have_vgpu10(svga));
797
      destroy_query_vgpu10(svga, sq);
798
      sws->fence_reference(sws, &sq->fence, NULL);
799
      break;
800
   case SVGA_QUERY_NUM_DRAW_CALLS:
801
   case SVGA_QUERY_NUM_FALLBACKS:
802
   case SVGA_QUERY_NUM_FLUSHES:
803
   case SVGA_QUERY_NUM_VALIDATIONS:
804
   case SVGA_QUERY_MAP_BUFFER_TIME:
805
   case SVGA_QUERY_NUM_BUFFERS_MAPPED:
806
   case SVGA_QUERY_NUM_TEXTURES_MAPPED:
807
   case SVGA_QUERY_NUM_BYTES_UPLOADED:
808
   case SVGA_QUERY_NUM_COMMAND_BUFFERS:
809
   case SVGA_QUERY_COMMAND_BUFFER_SIZE:
810
   case SVGA_QUERY_FLUSH_TIME:
811
   case SVGA_QUERY_SURFACE_WRITE_FLUSHES:
812
   case SVGA_QUERY_MEMORY_USED:
813
   case SVGA_QUERY_NUM_SHADERS:
814
   case SVGA_QUERY_NUM_RESOURCES:
815
   case SVGA_QUERY_NUM_STATE_OBJECTS:
816
   case SVGA_QUERY_NUM_SURFACE_VIEWS:
817
   case SVGA_QUERY_NUM_GENERATE_MIPMAP:
818
   case SVGA_QUERY_NUM_READBACKS:
819
   case SVGA_QUERY_NUM_RESOURCE_UPDATES:
820
   case SVGA_QUERY_NUM_BUFFER_UPLOADS:
821
   case SVGA_QUERY_NUM_CONST_BUF_UPDATES:
822
   case SVGA_QUERY_NUM_CONST_UPDATES:
823
   case SVGA_QUERY_NUM_FAILED_ALLOCATIONS:
824
   case SVGA_QUERY_NUM_COMMANDS_PER_DRAW:
825
   case SVGA_QUERY_NUM_SHADER_RELOCATIONS:
826
   case SVGA_QUERY_NUM_SURFACE_RELOCATIONS:
827
   case SVGA_QUERY_SHADER_MEM_USED:
828
      /* nothing */
829
      break;
830
   default:
831
      assert(!"svga: unexpected query type in svga_destroy_query()");
832
   }
833

834
   /* Free the query id */
835
   util_bitmask_clear(svga->query_id_bm, sq->id);
836

837
   FREE(sq);
838
}
839

840

841
static bool
842
svga_begin_query(struct pipe_context *pipe, struct pipe_query *q)
843
{
844
   struct svga_context *svga = svga_context(pipe);
845
   struct svga_query *sq = svga_query(q);
846
   enum pipe_error ret = PIPE_OK;
847

848
   assert(sq);
849
   assert(sq->type < SVGA_QUERY_MAX);
850

851
   /* Need to flush out buffered drawing commands so that they don't
852
    * get counted in the query results.
853
    */
854
   svga_hwtnl_flush_retry(svga);
855

856
   switch (sq->type) {
857
   case PIPE_QUERY_OCCLUSION_COUNTER:
858
   case PIPE_QUERY_OCCLUSION_PREDICATE:
859
   case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
860
      if (svga_have_vgpu10(svga)) {
861
         ret = begin_query_vgpu10(svga, sq);
862
         /* also need to start the associated occlusion predicate query */
863
         if (sq->predicate) {
864
            enum pipe_error status;
865
            status = begin_query_vgpu10(svga, svga_query(sq->predicate));
866
            assert(status == PIPE_OK);
867
            (void) status;
868
         }
869
      } else {
870
         begin_query_vgpu9(svga, sq);
871
      }
872
      assert(ret == PIPE_OK);
873
      (void) ret;
874
      break;
875
   case PIPE_QUERY_PRIMITIVES_GENERATED:
876
   case PIPE_QUERY_PRIMITIVES_EMITTED:
877
   case PIPE_QUERY_SO_STATISTICS:
878
   case PIPE_QUERY_TIMESTAMP:
879
      assert(svga_have_vgpu10(svga));
880
      ret = begin_query_vgpu10(svga, sq);
881
      assert(ret == PIPE_OK);
882
      break;
883
   case SVGA_QUERY_NUM_DRAW_CALLS:
884
      sq->begin_count = svga->hud.num_draw_calls;
885
      break;
886
   case SVGA_QUERY_NUM_FALLBACKS:
887
      sq->begin_count = svga->hud.num_fallbacks;
888
      break;
889
   case SVGA_QUERY_NUM_FLUSHES:
890
      sq->begin_count = svga->hud.num_flushes;
891
      break;
892
   case SVGA_QUERY_NUM_VALIDATIONS:
893
      sq->begin_count = svga->hud.num_validations;
894
      break;
895
   case SVGA_QUERY_MAP_BUFFER_TIME:
896
      sq->begin_count = svga->hud.map_buffer_time;
897
      break;
898
   case SVGA_QUERY_NUM_BUFFERS_MAPPED:
899
      sq->begin_count = svga->hud.num_buffers_mapped;
900
      break;
901
   case SVGA_QUERY_NUM_TEXTURES_MAPPED:
902
      sq->begin_count = svga->hud.num_textures_mapped;
903
      break;
904
   case SVGA_QUERY_NUM_BYTES_UPLOADED:
905
      sq->begin_count = svga->hud.num_bytes_uploaded;
906
      break;
907
   case SVGA_QUERY_NUM_COMMAND_BUFFERS:
908
      sq->begin_count = svga->swc->num_command_buffers;
909
      break;
910
   case SVGA_QUERY_COMMAND_BUFFER_SIZE:
911
      sq->begin_count = svga->hud.command_buffer_size;
912
      break;
913
   case SVGA_QUERY_FLUSH_TIME:
914
      sq->begin_count = svga->hud.flush_time;
915
      break;
916
   case SVGA_QUERY_SURFACE_WRITE_FLUSHES:
917
      sq->begin_count = svga->hud.surface_write_flushes;
918
      break;
919
   case SVGA_QUERY_NUM_READBACKS:
920
      sq->begin_count = svga->hud.num_readbacks;
921
      break;
922
   case SVGA_QUERY_NUM_RESOURCE_UPDATES:
923
      sq->begin_count = svga->hud.num_resource_updates;
924
      break;
925
   case SVGA_QUERY_NUM_BUFFER_UPLOADS:
926
      sq->begin_count = svga->hud.num_buffer_uploads;
927
      break;
928
   case SVGA_QUERY_NUM_CONST_BUF_UPDATES:
929
      sq->begin_count = svga->hud.num_const_buf_updates;
930
      break;
931
   case SVGA_QUERY_NUM_CONST_UPDATES:
932
      sq->begin_count = svga->hud.num_const_updates;
933
      break;
934
   case SVGA_QUERY_NUM_SHADER_RELOCATIONS:
935
      sq->begin_count = svga->swc->num_shader_reloc;
936
      break;
937
   case SVGA_QUERY_NUM_SURFACE_RELOCATIONS:
938
      sq->begin_count = svga->swc->num_surf_reloc;
939
      break;
940
   case SVGA_QUERY_MEMORY_USED:
941
   case SVGA_QUERY_NUM_SHADERS:
942
   case SVGA_QUERY_NUM_RESOURCES:
943
   case SVGA_QUERY_NUM_STATE_OBJECTS:
944
   case SVGA_QUERY_NUM_SURFACE_VIEWS:
945
   case SVGA_QUERY_NUM_GENERATE_MIPMAP:
946
   case SVGA_QUERY_NUM_FAILED_ALLOCATIONS:
947
   case SVGA_QUERY_NUM_COMMANDS_PER_DRAW:
948
   case SVGA_QUERY_SHADER_MEM_USED:
949
      /* nothing */
950
      break;
951
   default:
952
      assert(!"unexpected query type in svga_begin_query()");
953
   }
954

955
   SVGA_DBG(DEBUG_QUERY, "%s sq=0x%x id=%d type=%d svga_type=%d\n",
956
            __FUNCTION__, sq, sq->id, sq->type, sq->svga_type);
957

958
   sq->active = TRUE;
959

960
   return true;
961
}
962

963

964
static bool
965
svga_end_query(struct pipe_context *pipe, struct pipe_query *q)
966
{
967
   struct svga_context *svga = svga_context(pipe);
968
   struct svga_query *sq = svga_query(q);
969

970
   assert(sq);
971
   assert(sq->type < SVGA_QUERY_MAX);
972

973
   SVGA_DBG(DEBUG_QUERY, "%s sq=0x%x type=%d\n",
974
            __FUNCTION__, sq, sq->type);
975

976
   if (sq->type == PIPE_QUERY_TIMESTAMP && !sq->active)
977
      svga_begin_query(pipe, q);
978

979
   SVGA_DBG(DEBUG_QUERY, "%s sq=0x%x id=%d type=%d svga_type=%d\n",
980
            __FUNCTION__, sq, sq->id, sq->type, sq->svga_type);
981

982
   svga_hwtnl_flush_retry(svga);
983

984
   assert(sq->active);
985

986
   switch (sq->type) {
987
   case PIPE_QUERY_OCCLUSION_COUNTER:
988
   case PIPE_QUERY_OCCLUSION_PREDICATE:
989
   case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE:
990
      if (svga_have_vgpu10(svga)) {
991
         end_query_vgpu10(svga, sq);
992
         /* also need to end the associated occlusion predicate query */
993
         if (sq->predicate) {
994
            end_query_vgpu10(svga, svga_query(sq->predicate));
995
         }
996
      } else {
997
         end_query_vgpu9(svga, sq);
998
      }
999
      break;
1000
   case PIPE_QUERY_PRIMITIVES_GENERATED:
1001
   case PIPE_QUERY_PRIMITIVES_EMITTED:
1002
   case PIPE_QUERY_SO_STATISTICS:
1003
   case PIPE_QUERY_TIMESTAMP:
1004
      assert(svga_have_vgpu10(svga));
1005
      end_query_vgpu10(svga, sq);
1006
      break;
1007
   case SVGA_QUERY_NUM_DRAW_CALLS:
1008
      sq->end_count = svga->hud.num_draw_calls;
1009
      break;
1010
   case SVGA_QUERY_NUM_FALLBACKS:
1011
      sq->end_count = svga->hud.num_fallbacks;
1012
      break;
1013
   case SVGA_QUERY_NUM_FLUSHES:
1014
      sq->end_count = svga->hud.num_flushes;
1015
      break;
1016
   case SVGA_QUERY_NUM_VALIDATIONS:
1017
      sq->end_count = svga->hud.num_validations;
1018
      break;
1019
   case SVGA_QUERY_MAP_BUFFER_TIME:
1020
      sq->end_count = svga->hud.map_buffer_time;
1021
      break;
1022
   case SVGA_QUERY_NUM_BUFFERS_MAPPED:
1023
      sq->end_count = svga->hud.num_buffers_mapped;
1024
      break;
1025
   case SVGA_QUERY_NUM_TEXTURES_MAPPED:
1026
      sq->end_count = svga->hud.num_textures_mapped;
1027
      break;
1028
   case SVGA_QUERY_NUM_BYTES_UPLOADED:
1029
      sq->end_count = svga->hud.num_bytes_uploaded;
1030
      break;
1031
   case SVGA_QUERY_NUM_COMMAND_BUFFERS:
1032
      sq->end_count = svga->swc->num_command_buffers;
1033
      break;
1034
   case SVGA_QUERY_COMMAND_BUFFER_SIZE:
1035
      sq->end_count = svga->hud.command_buffer_size;
1036
      break;
1037
   case SVGA_QUERY_FLUSH_TIME:
1038
      sq->end_count = svga->hud.flush_time;
1039
      break;
1040
   case SVGA_QUERY_SURFACE_WRITE_FLUSHES:
1041
      sq->end_count = svga->hud.surface_write_flushes;
1042
      break;
1043
   case SVGA_QUERY_NUM_READBACKS:
1044
      sq->end_count = svga->hud.num_readbacks;
1045
      break;
1046
   case SVGA_QUERY_NUM_RESOURCE_UPDATES:
1047
      sq->end_count = svga->hud.num_resource_updates;
1048
      break;
1049
   case SVGA_QUERY_NUM_BUFFER_UPLOADS:
1050
      sq->end_count = svga->hud.num_buffer_uploads;
1051
      break;
1052
   case SVGA_QUERY_NUM_CONST_BUF_UPDATES:
1053
      sq->end_count = svga->hud.num_const_buf_updates;
1054
      break;
1055
   case SVGA_QUERY_NUM_CONST_UPDATES:
1056
      sq->end_count = svga->hud.num_const_updates;
1057
      break;
1058
   case SVGA_QUERY_NUM_SHADER_RELOCATIONS:
1059
      sq->end_count = svga->swc->num_shader_reloc;
1060
      break;
1061
   case SVGA_QUERY_NUM_SURFACE_RELOCATIONS:
1062
      sq->end_count = svga->swc->num_surf_reloc;
1063
      break;
1064
   case SVGA_QUERY_MEMORY_USED:
1065
   case SVGA_QUERY_NUM_SHADERS:
1066
   case SVGA_QUERY_NUM_RESOURCES:
1067
   case SVGA_QUERY_NUM_STATE_OBJECTS:
1068
   case SVGA_QUERY_NUM_SURFACE_VIEWS:
1069
   case SVGA_QUERY_NUM_GENERATE_MIPMAP:
1070
   case SVGA_QUERY_NUM_FAILED_ALLOCATIONS:
1071
   case SVGA_QUERY_NUM_COMMANDS_PER_DRAW:
1072
   case SVGA_QUERY_SHADER_MEM_USED:
1073
      /* nothing */
1074
      break;
1075
   default:
1076
      assert(!"unexpected query type in svga_end_query()");
1077
   }
1078
   sq->active = FALSE;
1079
   return true;
1080
}
1081

1082

1083
static bool
1084
svga_get_query_result(struct pipe_context *pipe,
1085
                      struct pipe_query *q,
1086
                      bool wait,
1087
                      union pipe_query_result *vresult)
1088
{
1089
   struct svga_screen *svgascreen = svga_screen(pipe->screen);
1090
   struct svga_context *svga = svga_context(pipe);
1091
   struct svga_query *sq = svga_query(q);
1092
   uint64_t *result = (uint64_t *)vresult;
1093
   bool ret = true;
1094

1095
   assert(sq);
1096

1097
   SVGA_DBG(DEBUG_QUERY, "%s sq=0x%x id=%d wait: %d\n",
1098
            __FUNCTION__, sq, sq->id, wait);
1099

1100
   switch (sq->type) {
1101
   case PIPE_QUERY_OCCLUSION_COUNTER:
1102
      if (svga_have_vgpu10(svga)) {
1103
         SVGADXOcclusionQueryResult occResult;
1104
         ret = get_query_result_vgpu10(svga, sq, wait,
1105
                                       (void *)&occResult, sizeof(occResult));
1106
         *result = (uint64_t)occResult.samplesRendered;
1107
      } else {
1108
         ret = get_query_result_vgpu9(svga, sq, wait, result);
1109
      }
1110
      break;
1111
   case PIPE_QUERY_OCCLUSION_PREDICATE:
1112
   case PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE: {
1113
      if (svga_have_vgpu10(svga)) {
1114
         SVGADXOcclusionPredicateQueryResult occResult;
1115
         ret = get_query_result_vgpu10(svga, sq, wait,
1116
                                       (void *)&occResult, sizeof(occResult));
1117
         vresult->b = occResult.anySamplesRendered != 0;
1118
      } else {
1119
         uint64_t count = 0;
1120
         ret = get_query_result_vgpu9(svga, sq, wait, &count);
1121
         vresult->b = count != 0;
1122
      }
1123
      break;
1124
   }
1125
   case PIPE_QUERY_SO_STATISTICS: {
1126
      SVGADXStreamOutStatisticsQueryResult sResult;
1127
      struct pipe_query_data_so_statistics *pResult =
1128
         (struct pipe_query_data_so_statistics *)vresult;
1129

1130
      assert(svga_have_vgpu10(svga));
1131
      ret = get_query_result_vgpu10(svga, sq, wait,
1132
                                    (void *)&sResult, sizeof(sResult));
1133
      pResult->num_primitives_written = sResult.numPrimitivesWritten;
1134
      pResult->primitives_storage_needed = sResult.numPrimitivesRequired;
1135
      break;
1136
   }
1137
   case PIPE_QUERY_TIMESTAMP: {
1138
      SVGADXTimestampQueryResult sResult;
1139

1140
      assert(svga_have_vgpu10(svga));
1141
      ret = get_query_result_vgpu10(svga, sq, wait,
1142
                                    (void *)&sResult, sizeof(sResult));
1143
      *result = (uint64_t)sResult.timestamp;
1144
      break;
1145
   }
1146
   case PIPE_QUERY_PRIMITIVES_GENERATED: {
1147
      SVGADXStreamOutStatisticsQueryResult sResult;
1148

1149
      assert(svga_have_vgpu10(svga));
1150
      ret = get_query_result_vgpu10(svga, sq, wait,
1151
                                    (void *)&sResult, sizeof sResult);
1152
      *result = (uint64_t)sResult.numPrimitivesRequired;
1153
      break;
1154
   }
1155
   case PIPE_QUERY_PRIMITIVES_EMITTED: {
1156
      SVGADXStreamOutStatisticsQueryResult sResult;
1157

1158
      assert(svga_have_vgpu10(svga));
1159
      ret = get_query_result_vgpu10(svga, sq, wait,
1160
                                    (void *)&sResult, sizeof sResult);
1161
      *result = (uint64_t)sResult.numPrimitivesWritten;
1162
      break;
1163
   }
1164
   /* These are per-frame counters */
1165
   case SVGA_QUERY_NUM_DRAW_CALLS:
1166
   case SVGA_QUERY_NUM_FALLBACKS:
1167
   case SVGA_QUERY_NUM_FLUSHES:
1168
   case SVGA_QUERY_NUM_VALIDATIONS:
1169
   case SVGA_QUERY_MAP_BUFFER_TIME:
1170
   case SVGA_QUERY_NUM_BUFFERS_MAPPED:
1171
   case SVGA_QUERY_NUM_TEXTURES_MAPPED:
1172
   case SVGA_QUERY_NUM_BYTES_UPLOADED:
1173
   case SVGA_QUERY_NUM_COMMAND_BUFFERS:
1174
   case SVGA_QUERY_COMMAND_BUFFER_SIZE:
1175
   case SVGA_QUERY_FLUSH_TIME:
1176
   case SVGA_QUERY_SURFACE_WRITE_FLUSHES:
1177
   case SVGA_QUERY_NUM_READBACKS:
1178
   case SVGA_QUERY_NUM_RESOURCE_UPDATES:
1179
   case SVGA_QUERY_NUM_BUFFER_UPLOADS:
1180
   case SVGA_QUERY_NUM_CONST_BUF_UPDATES:
1181
   case SVGA_QUERY_NUM_CONST_UPDATES:
1182
   case SVGA_QUERY_NUM_SHADER_RELOCATIONS:
1183
   case SVGA_QUERY_NUM_SURFACE_RELOCATIONS:
1184
      vresult->u64 = sq->end_count - sq->begin_count;
1185
      break;
1186
   /* These are running total counters */
1187
   case SVGA_QUERY_MEMORY_USED:
1188
      vresult->u64 = svgascreen->hud.total_resource_bytes;
1189
      break;
1190
   case SVGA_QUERY_NUM_SHADERS:
1191
      vresult->u64 = svga->hud.num_shaders;
1192
      break;
1193
   case SVGA_QUERY_NUM_RESOURCES:
1194
      vresult->u64 = svgascreen->hud.num_resources;
1195
      break;
1196
   case SVGA_QUERY_NUM_STATE_OBJECTS:
1197
      vresult->u64 = (svga->hud.num_blend_objects +
1198
                      svga->hud.num_depthstencil_objects +
1199
                      svga->hud.num_rasterizer_objects +
1200
                      svga->hud.num_sampler_objects +
1201
                      svga->hud.num_samplerview_objects +
1202
                      svga->hud.num_vertexelement_objects);
1203
      break;
1204
   case SVGA_QUERY_NUM_SURFACE_VIEWS:
1205
      vresult->u64 = svga->hud.num_surface_views;
1206
      break;
1207
   case SVGA_QUERY_NUM_GENERATE_MIPMAP:
1208
      vresult->u64 = svga->hud.num_generate_mipmap;
1209
      break;
1210
   case SVGA_QUERY_NUM_FAILED_ALLOCATIONS:
1211
      vresult->u64 = svgascreen->hud.num_failed_allocations;
1212
      break;
1213
   case SVGA_QUERY_NUM_COMMANDS_PER_DRAW:
1214
      vresult->f = (float) svga->swc->num_commands
1215
         / (float) svga->swc->num_draw_commands;
1216
      break;
1217
   case SVGA_QUERY_SHADER_MEM_USED:
1218
      vresult->u64 = svga->hud.shader_mem_used;
1219
      break;
1220
   default:
1221
      assert(!"unexpected query type in svga_get_query_result");
1222
   }
1223

1224
   SVGA_DBG(DEBUG_QUERY, "%s result %d\n", __FUNCTION__, *((uint64_t *)vresult));
1225

1226
   return ret;
1227
}
1228

1229
static void
1230
svga_render_condition(struct pipe_context *pipe, struct pipe_query *q,
1231
                      bool condition, enum pipe_render_cond_flag mode)
1232
{
1233
   struct svga_context *svga = svga_context(pipe);
1234
   struct svga_winsys_screen *sws = svga_screen(svga->pipe.screen)->sws;
1235
   struct svga_query *sq = svga_query(q);
1236
   SVGA3dQueryId queryId;
1237

1238
   SVGA_DBG(DEBUG_QUERY, "%s\n", __FUNCTION__);
1239

1240
   assert(svga_have_vgpu10(svga));
1241
   if (sq == NULL) {
1242
      queryId = SVGA3D_INVALID_ID;
1243
   }
1244
   else {
1245
      assert(sq->svga_type == SVGA3D_QUERYTYPE_OCCLUSION ||
1246
             sq->svga_type == SVGA3D_QUERYTYPE_OCCLUSIONPREDICATE);
1247

1248
      if (sq->svga_type == SVGA3D_QUERYTYPE_OCCLUSION) {
1249
         assert(sq->predicate);
1250
         /**
1251
          * For conditional rendering, make sure to use the associated
1252
          * predicate query.
1253
          */
1254
         sq = svga_query(sq->predicate);
1255
      }
1256
      queryId = sq->id;
1257

1258
      if ((mode == PIPE_RENDER_COND_WAIT ||
1259
           mode == PIPE_RENDER_COND_BY_REGION_WAIT) && sq->fence) {
1260
         sws->fence_finish(sws, sq->fence, PIPE_TIMEOUT_INFINITE,
1261
                           SVGA_FENCE_FLAG_QUERY);
1262
      }
1263
   }
1264
   /*
1265
    * if the kernel module doesn't support the predication command,
1266
    * we'll just render unconditionally.
1267
    * This is probably acceptable for the typical case of occlusion culling.
1268
    */
1269
   if (sws->have_set_predication_cmd) {
1270
      SVGA_RETRY(svga, SVGA3D_vgpu10_SetPredication(svga->swc, queryId,
1271
                                                    (uint32) condition));
1272
      svga->pred.query_id = queryId;
1273
      svga->pred.cond = condition;
1274
   }
1275

1276
   svga->render_condition = (sq != NULL);
1277
}
1278

1279

1280
/*
1281
 * This function is a workaround because we lack the ability to query
1282
 * renderer's time synchronously.
1283
 */
1284
static uint64_t
1285
svga_get_timestamp(struct pipe_context *pipe)
1286
{
1287
   struct pipe_query *q = svga_create_query(pipe, PIPE_QUERY_TIMESTAMP, 0);
1288
   union pipe_query_result result;
1289

1290
   svga_begin_query(pipe, q);
1291
   svga_end_query(pipe,q);
1292
   svga_get_query_result(pipe, q, TRUE, &result);
1293
   svga_destroy_query(pipe, q);
1294

1295
   return result.u64;
1296
}
1297

1298

1299
/**
 * Hook installed as pipe_context::set_active_query_state.
 *
 * This implementation does nothing; both arguments are ignored.
 */
static void
svga_set_active_query_state(struct pipe_context *pipe, bool enable)
{
   (void) pipe;
   (void) enable;
}
1303

1304

1305
/**
1306
 * \brief Toggle conditional rendering if already enabled
1307
 *
1308
 * \param svga[in]  The svga context
1309
 * \param render_condition_enabled[in]  Whether to ignore requests to turn
1310
 * conditional rendering off
1311
 * \param on[in]  Whether to turn conditional rendering on or off
1312
 */
1313
void
1314
svga_toggle_render_condition(struct svga_context *svga,
1315
                             boolean render_condition_enabled,
1316
                             boolean on)
1317
{
1318
   SVGA3dQueryId query_id;
1319

1320
   if (render_condition_enabled ||
1321
       svga->pred.query_id == SVGA3D_INVALID_ID) {
1322
      return;
1323
   }
1324

1325
   /*
1326
    * If we get here, it means that the system supports
1327
    * conditional rendering since svga->pred.query_id has already been
1328
    * modified for this context and thus support has already been
1329
    * verified.
1330
    */
1331
   query_id = on ? svga->pred.query_id : SVGA3D_INVALID_ID;
1332

1333
   SVGA_RETRY(svga, SVGA3D_vgpu10_SetPredication(svga->swc, query_id,
1334
                                                 (uint32) svga->pred.cond));
1335
}
1336

1337

1338
void
1339
svga_init_query_functions(struct svga_context *svga)
1340
{
1341
   svga->pipe.create_query = svga_create_query;
1342
   svga->pipe.destroy_query = svga_destroy_query;
1343
   svga->pipe.begin_query = svga_begin_query;
1344
   svga->pipe.end_query = svga_end_query;
1345
   svga->pipe.get_query_result = svga_get_query_result;
1346
   svga->pipe.set_active_query_state = svga_set_active_query_state;
1347
   svga->pipe.render_condition = svga_render_condition;
1348
   svga->pipe.get_timestamp = svga_get_timestamp;
1349
}
1350

1351
Product

Resources

Company