blob: ddcef73c4561233ae3bd4f86d732468982291da3 [file] [log] [blame]
/*
 * Vulkan
 *
 * Copyright (C) 2014 LunarG, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included
 * in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 *
 * Authors:
 *   Chia-I Wu <olv@lunarg.com>
 */
27
28#include "dev.h"
29#include "mem.h"
30#include "query.h"
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -060031#include "genhw/genhw.h"
Chia-I Wue18ff1b2014-08-07 13:38:51 +080032
33static void query_destroy(struct intel_obj *obj)
34{
35 struct intel_query *query = intel_query_from_obj(obj);
36
Tony Barbour2094dc72015-07-09 15:26:32 -060037 intel_mem_free(obj->mem);
Chia-I Wue18ff1b2014-08-07 13:38:51 +080038 intel_query_destroy(query);
39}
40
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -060041static void query_init_pipeline_statistics(
42 struct intel_dev *dev,
43 const VkQueryPoolCreateInfo *info,
44 struct intel_query *query)
45{
46 /*
47 * Note: order defined by Vulkan spec.
48 */
49 const uint32_t regs[][2] = {
Courtney Goeltzenleuchterb93427c2015-10-15 16:57:32 -060050 {VK_QUERY_PIPELINE_STATISTIC_INPUT_ASSEMBLY_PRIMITIVES_BIT, GEN6_REG_IA_PRIMITIVES_COUNT},
51 {VK_QUERY_PIPELINE_STATISTIC_VERTEX_SHADER_INVOCATIONS_BIT, GEN6_REG_VS_INVOCATION_COUNT},
52 {VK_QUERY_PIPELINE_STATISTIC_GEOMETRY_SHADER_INVOCATIONS_BIT, GEN6_REG_GS_INVOCATION_COUNT},
53 {VK_QUERY_PIPELINE_STATISTIC_GEOMETRY_SHADER_PRIMITIVES_BIT, GEN6_REG_GS_PRIMITIVES_COUNT},
54 {VK_QUERY_PIPELINE_STATISTIC_CLIPPING_INVOCATIONS_BIT, GEN6_REG_CL_INVOCATION_COUNT},
55 {VK_QUERY_PIPELINE_STATISTIC_CLIPPING_PRIMITIVES_BIT, GEN6_REG_CL_PRIMITIVES_COUNT},
56 {VK_QUERY_PIPELINE_STATISTIC_FRAGMENT_SHADER_INVOCATIONS_BIT, GEN6_REG_PS_INVOCATION_COUNT},
57 {VK_QUERY_PIPELINE_STATISTIC_TESSELLATION_CONTROL_SHADER_PATCHES_BIT, (intel_gpu_gen(dev->gpu) >= INTEL_GEN(7)) ? GEN7_REG_HS_INVOCATION_COUNT : 0},
58 {VK_QUERY_PIPELINE_STATISTIC_TESSELLATION_EVALUATION_SHADER_INVOCATIONS_BIT, (intel_gpu_gen(dev->gpu) >= INTEL_GEN(7)) ? GEN7_REG_DS_INVOCATION_COUNT : 0},
59 {VK_QUERY_PIPELINE_STATISTIC_COMPUTE_SHADER_INVOCATIONS_BIT, 0}
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -060060 };
61 STATIC_ASSERT(ARRAY_SIZE(regs) < 32);
62 uint32_t i;
63 uint32_t reg_count = 0;
64
65 /*
66 * Only query registers indicated via pipeline statistics flags.
67 * If HW does not support a flag, fill value with 0.
68 */
69 for (i=0; i < ARRAY_SIZE(regs); i++) {
70 if ((regs[i][0] & info->pipelineStatistics)) {
71 query->regs[reg_count] = regs[i][1];
72 reg_count++;
73 }
74 }
75
76 query->reg_count = reg_count;
77 query->slot_stride = u_align(reg_count * sizeof(uint64_t) * 2, 64);
78}
79
Courtney Goeltzenleuchter382489d2015-04-10 08:34:15 -060080VkResult intel_query_create(struct intel_dev *dev,
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -060081 const VkQueryPoolCreateInfo *info,
82 struct intel_query **query_ret)
Chia-I Wue18ff1b2014-08-07 13:38:51 +080083{
84 struct intel_query *query;
85
Chia-I Wu545c2e12015-02-22 13:19:54 +080086 query = (struct intel_query *) intel_base_create(&dev->base.handle,
Courtney Goeltzenleuchter1c7c65d2015-06-10 17:39:03 -060087 sizeof(*query), dev->base.dbg, VK_OBJECT_TYPE_QUEUE,
Chia-I Wu545c2e12015-02-22 13:19:54 +080088 info, 0);
Chia-I Wue18ff1b2014-08-07 13:38:51 +080089 if (!query)
Tony Barbour8205d902015-04-16 15:59:00 -060090 return VK_ERROR_OUT_OF_HOST_MEMORY;
Chia-I Wue18ff1b2014-08-07 13:38:51 +080091
92 query->type = info->queryType;
93 query->slot_count = info->slots;
94
Chia-I Wu659650f2014-08-07 14:11:49 +080095 /*
96 * For each query type, the GPU will be asked to write the values of some
97 * registers to a buffer before and after a sequence of commands. We will
98 * compare the differences to get the query results.
99 */
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800100 switch (info->queryType) {
Tony Barbour8205d902015-04-16 15:59:00 -0600101 case VK_QUERY_TYPE_OCCLUSION:
Chia-I Wu759fa2e2014-08-30 18:44:47 +0800102 query->slot_stride = u_align(sizeof(uint64_t) * 2, 64);
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800103 break;
Tony Barbour8205d902015-04-16 15:59:00 -0600104 case VK_QUERY_TYPE_PIPELINE_STATISTICS:
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600105 query_init_pipeline_statistics(dev, info, query);
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800106 break;
107 default:
Tobin Ehlis8b4f1672015-09-21 11:23:11 -0600108 assert(!"unknown query type");
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800109 break;
110 }
111
Tony Barbour2094dc72015-07-09 15:26:32 -0600112 VkMemoryAllocInfo mem_reqs;
113 mem_reqs.sType = VK_STRUCTURE_TYPE_MEMORY_ALLOC_INFO;
114 mem_reqs.allocationSize = query->slot_stride * query->slot_count;
115 mem_reqs.pNext = NULL;
116 mem_reqs.memoryTypeIndex = 0;
117 intel_mem_alloc(dev, &mem_reqs, &query->obj.mem);
118
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800119 query->obj.destroy = query_destroy;
120
121 *query_ret = query;
122
Courtney Goeltzenleuchter9cc421e2015-04-08 15:36:08 -0600123 return VK_SUCCESS;
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800124}
125
126void intel_query_destroy(struct intel_query *query)
127{
128 intel_base_destroy(&query->obj.base);
129}
130
Chia-I Wu659650f2014-08-07 14:11:49 +0800131static void
132query_process_occlusion(const struct intel_query *query,
Mark Lobodzinskie2d07a52015-01-29 08:55:56 -0600133 uint32_t count, const uint8_t *raw,
Chia-I Wu659650f2014-08-07 14:11:49 +0800134 uint64_t *results)
135{
Mark Lobodzinskie2d07a52015-01-29 08:55:56 -0600136 uint32_t i;
Chia-I Wu659650f2014-08-07 14:11:49 +0800137
138 for (i = 0; i < count; i++) {
139 const uint32_t *pair = (const uint32_t *) raw;
140
141 results[i] = pair[1] - pair[0];
142 raw += query->slot_stride;
143 }
144}
145
146static void
147query_process_pipeline_statistics(const struct intel_query *query,
Mark Lobodzinskie2d07a52015-01-29 08:55:56 -0600148 uint32_t count, const uint8_t *raw,
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600149 void *results)
Chia-I Wu659650f2014-08-07 14:11:49 +0800150{
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600151 const uint32_t num_regs = query->reg_count;
Mark Lobodzinskie2d07a52015-01-29 08:55:56 -0600152 uint32_t i, j;
Chia-I Wu659650f2014-08-07 14:11:49 +0800153
154 for (i = 0; i < count; i++) {
155 const uint64_t *before = (const uint64_t *) raw;
156 const uint64_t *after = before + num_regs;
157 uint64_t *dst = (uint64_t *) (results + i);
158
159 for (j = 0; j < num_regs; j++)
160 dst[j] = after[j] - before[j];
161
162 raw += query->slot_stride;
163 }
164}
165
Courtney Goeltzenleuchter382489d2015-04-10 08:34:15 -0600166VkResult intel_query_get_results(struct intel_query *query,
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600167 uint32_t slot_start, uint32_t slot_count,
168 void *results)
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800169{
170 const uint8_t *ptr;
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800171
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800172 if (intel_mem_is_busy(query->obj.mem))
Courtney Goeltzenleuchter9cc421e2015-04-08 15:36:08 -0600173 return VK_NOT_READY;
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800174
175 ptr = (const uint8_t *) intel_mem_map_sync(query->obj.mem, false);
176 if (!ptr)
Courtney Goeltzenleuchter9cc421e2015-04-08 15:36:08 -0600177 return VK_ERROR_MEMORY_MAP_FAILED;
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800178
179 ptr += query->obj.offset + query->slot_stride * slot_start;
180
181 switch (query->type) {
Tony Barbour8205d902015-04-16 15:59:00 -0600182 case VK_QUERY_TYPE_OCCLUSION:
Chia-I Wu659650f2014-08-07 14:11:49 +0800183 query_process_occlusion(query, slot_count, ptr, results);
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800184 break;
Tony Barbour8205d902015-04-16 15:59:00 -0600185 case VK_QUERY_TYPE_PIPELINE_STATISTICS:
Chia-I Wu659650f2014-08-07 14:11:49 +0800186 query_process_pipeline_statistics(query, slot_count, ptr, results);
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800187 break;
188 default:
189 assert(0);
190 break;
191 }
192
193 intel_mem_unmap(query->obj.mem);
194
Courtney Goeltzenleuchter9cc421e2015-04-08 15:36:08 -0600195 return VK_SUCCESS;
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800196}
197
Courtney Goeltzenleuchter382489d2015-04-10 08:34:15 -0600198ICD_EXPORT VkResult VKAPI vkCreateQueryPool(
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600199 VkDevice device,
200 const VkQueryPoolCreateInfo* pCreateInfo,
201 VkQueryPool* pQueryPool)
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800202{
Chia-I Wuf667a6a2014-08-07 14:15:01 +0800203 struct intel_dev *dev = intel_dev(device);
204
205 return intel_query_create(dev, pCreateInfo,
206 (struct intel_query **) pQueryPool);
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800207}
208
Mark Lobodzinski67b42b72015-09-07 13:59:43 -0600209ICD_EXPORT void VKAPI vkDestroyQueryPool(
Tony Barbourde4124d2015-07-03 10:33:54 -0600210 VkDevice device,
211 VkQueryPool queryPool)
212
213 {
214 struct intel_obj *obj = intel_obj(queryPool.handle);
215
216 obj->destroy(obj);
Tony Barbourde4124d2015-07-03 10:33:54 -0600217 }
218
Courtney Goeltzenleuchter382489d2015-04-10 08:34:15 -0600219ICD_EXPORT VkResult VKAPI vkGetQueryPoolResults(
Mike Stroyan230e6252015-04-17 12:36:38 -0600220 VkDevice device,
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600221 VkQueryPool queryPool,
Mark Lobodzinskie2d07a52015-01-29 08:55:56 -0600222 uint32_t startQuery,
223 uint32_t queryCount,
224 size_t* pDataSize,
Tony Barbour8205d902015-04-16 15:59:00 -0600225 void* pData,
226 VkQueryResultFlags flags)
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800227{
Chia-I Wuf667a6a2014-08-07 14:15:01 +0800228 struct intel_query *query = intel_query(queryPool);
229
230 switch (query->type) {
Tony Barbour8205d902015-04-16 15:59:00 -0600231 case VK_QUERY_TYPE_OCCLUSION:
Chia-I Wuf667a6a2014-08-07 14:15:01 +0800232 *pDataSize = sizeof(uint64_t) * queryCount;
233 break;
Tony Barbour8205d902015-04-16 15:59:00 -0600234 case VK_QUERY_TYPE_PIPELINE_STATISTICS:
Courtney Goeltzenleuchter29862812015-04-16 09:13:59 -0600235 *pDataSize = query->slot_stride * queryCount;
Chia-I Wuf667a6a2014-08-07 14:15:01 +0800236 break;
237 default:
Tobin Ehlis8b4f1672015-09-21 11:23:11 -0600238 assert(!"unknown query type");
Chia-I Wuf667a6a2014-08-07 14:15:01 +0800239 break;
240 }
241
242 if (pData)
243 return intel_query_get_results(query, startQuery, queryCount, pData);
244 else
Courtney Goeltzenleuchter9cc421e2015-04-08 15:36:08 -0600245 return VK_SUCCESS;
Chia-I Wue18ff1b2014-08-07 13:38:51 +0800246}