blob: 4d9daf784b610d75047aa26bffb03d625ac165ba [file] [log] [blame]
Chia-I Wu09142132014-08-11 15:42:55 +08001/*
2 * XGL
3 *
4 * Copyright (C) 2014 LunarG, Inc.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
Chia-I Wu44e42362014-09-02 08:32:09 +080023 *
24 * Authors:
25 * Chia-I Wu <olv@lunarg.com>
26 * Courtney Goeltzenleuchter <courtney@lunarg.com>
Chia-I Wu09142132014-08-11 15:42:55 +080027 */
28
29#ifndef CMD_H
30#define CMD_H
31
32#include "intel.h"
33#include "obj.h"
Chia-I Wub2755562014-08-20 13:38:52 +080034#include "view.h"
35
36struct intel_pipeline;
Chia-I Wuf2b6d722014-09-02 08:52:27 +080037struct intel_pipeline_shader;
Chia-I Wub2755562014-08-20 13:38:52 +080038struct intel_pipeline_delta;
39struct intel_viewport_state;
40struct intel_raster_state;
41struct intel_msaa_state;
42struct intel_blend_state;
43struct intel_ds_state;
44struct intel_dset;
45
Chia-I Wu958d1b72014-08-21 11:28:11 +080046struct intel_cmd_reloc;
47
Chia-I Wu8370b402014-08-29 12:28:37 +080048/*
49 * We know what workarounds are needed for intel_pipeline. These are mostly
50 * for intel_pipeline_delta.
51 */
52enum intel_cmd_wa_flags {
53 /*
54 * From the Sandy Bridge PRM, volume 2 part 1, page 60:
55 *
56 * "Before any depth stall flush (including those produced by
57 * non-pipelined state commands), software needs to first send a
58 * PIPE_CONTROL with no bits set except Post-Sync Operation != 0."
59 */
60 INTEL_CMD_WA_GEN6_PRE_DEPTH_STALL_WRITE = 1 << 0,
61
62 /*
63 * From the Sandy Bridge PRM, volume 2 part 1, page 274:
64 *
65 * "A PIPE_CONTROL command, with only the Stall At Pixel Scoreboard
66 * field set (DW1 Bit 1), must be issued prior to any change to the
67 * value in this field (Maximum Number of Threads in 3DSTATE_WM)"
68 *
69 * From the Ivy Bridge PRM, volume 2 part 1, page 286:
70 *
71 * "If this field (Maximum Number of Threads in 3DSTATE_PS) is changed
72 * between 3DPRIMITIVE commands, a PIPE_CONTROL command with Stall at
73 * Pixel Scoreboard set is required to be issued."
74 */
75 INTEL_CMD_WA_GEN6_PRE_COMMAND_SCOREBOARD_STALL = 1 << 1,
76
77 /*
78 * From the Ivy Bridge PRM, volume 2 part 1, page 106:
79 *
80 * "A PIPE_CONTROL with Post-Sync Operation set to 1h and a depth
81 * stall needs to be sent just prior to any 3DSTATE_VS,
82 * 3DSTATE_URB_VS, 3DSTATE_CONSTANT_VS,
83 * 3DSTATE_BINDING_TABLE_POINTER_VS, 3DSTATE_SAMPLER_STATE_POINTER_VS
84 * command. Only one PIPE_CONTROL needs to be sent before any
85 * combination of VS associated 3DSTATE."
86 */
87 INTEL_CMD_WA_GEN7_PRE_VS_DEPTH_STALL_WRITE = 1 << 2,
88
89 /*
90 * From the Ivy Bridge PRM, volume 2 part 1, page 258:
91 *
92 * "Due to an HW issue driver needs to send a pipe control with stall
93 * when ever there is state change in depth bias related state"
94 *
95 * From the Ivy Bridge PRM, volume 2 part 1, page 292:
96 *
97 * "A PIPE_CONTOL command with the CS Stall bit set must be programmed
98 * in the ring after this instruction
99 * (3DSTATE_PUSH_CONSTANT_ALLOC_PS)."
100 */
101 INTEL_CMD_WA_GEN7_POST_COMMAND_CS_STALL = 1 << 3,
102
103 /*
104 * From the Ivy Bridge PRM, volume 2 part 1, page 276:
105 *
106 * "The driver must make sure a PIPE_CONTROL with the Depth Stall
107 * Enable bit set after all the following states are programmed:
108 *
109 * - 3DSTATE_PS
110 * - 3DSTATE_VIEWPORT_STATE_POINTERS_CC
111 * - 3DSTATE_CONSTANT_PS
112 * - 3DSTATE_BINDING_TABLE_POINTERS_PS
113 * - 3DSTATE_SAMPLER_STATE_POINTERS_PS
114 * - 3DSTATE_CC_STATE_POINTERS
115 * - 3DSTATE_BLEND_STATE_POINTERS
116 * - 3DSTATE_DEPTH_STENCIL_STATE_POINTERS"
117 */
118 INTEL_CMD_WA_GEN7_POST_COMMAND_DEPTH_STALL = 1 << 4,
119};
120
Chia-I Wu68f319d2014-09-09 09:43:21 +0800121enum intel_cmd_writer_type {
122 INTEL_CMD_WRITER_BATCH,
123 INTEL_CMD_WRITER_STATE,
124 INTEL_CMD_WRITER_INSTRUCTION,
125
126 INTEL_CMD_WRITER_COUNT,
127};
128
Courtney Goeltzenleuchterd85c1d62014-08-27 14:04:53 -0600129struct intel_cmd_shader {
Chia-I Wuf2b6d722014-09-02 08:52:27 +0800130 const struct intel_pipeline_shader *shader;
Courtney Goeltzenleuchterd85c1d62014-08-27 14:04:53 -0600131 XGL_UINT kernel_pos;
132};
133
Chia-I Wub2755562014-08-20 13:38:52 +0800134/*
135 * States bounded to the command buffer. We want to write states directly to
136 * the command buffer when possible, and reduce this struct.
137 */
138struct intel_cmd_bind {
139 struct {
140 const struct intel_pipeline *graphics;
141 const struct intel_pipeline *compute;
142 const struct intel_pipeline_delta *graphics_delta;
143 const struct intel_pipeline_delta *compute_delta;
144 } pipeline;
145
Courtney Goeltzenleuchterba305812014-08-28 17:27:47 -0600146 /*
147 * Currently active shaders for this command buffer.
148 * Provides data only available after shaders are bound to
149 * a command buffer, such as the kernel position in the kernel BO
150 */
151 struct intel_cmd_shader vs;
152 struct intel_cmd_shader fs;
153 struct intel_cmd_shader gs;
Chia-I Wu95959fb2014-09-02 11:01:03 +0800154 struct intel_cmd_shader tcs;
155 struct intel_cmd_shader tes;
156 struct intel_cmd_shader cs;
Courtney Goeltzenleuchterba305812014-08-28 17:27:47 -0600157
Chia-I Wub2755562014-08-20 13:38:52 +0800158 struct {
Chia-I Wu338fe642014-08-28 10:43:04 +0800159 XGL_UINT count;
160 XGL_UINT used;
161 struct intel_cmd_shader *shaderArray;
Courtney Goeltzenleuchterd85c1d62014-08-27 14:04:53 -0600162 } shaderCache;
163
164 struct {
Chia-I Wub2755562014-08-20 13:38:52 +0800165 const struct intel_viewport_state *viewport;
166 const struct intel_raster_state *raster;
167 const struct intel_msaa_state *msaa;
168 const struct intel_blend_state *blend;
169 const struct intel_ds_state *ds;
170 } state;
171
172 struct {
173 const struct intel_dset *graphics;
174 XGL_UINT graphics_offset;
175 const struct intel_dset *compute;
176 XGL_UINT compute_offset;
177 } dset;
178
179 struct {
180 struct intel_mem_view graphics;
181 struct intel_mem_view compute;
Chia-I Wu9f1722c2014-08-25 10:17:58 +0800182 } dyn_view;
Chia-I Wub2755562014-08-20 13:38:52 +0800183
184 struct {
185 const struct intel_mem *mem;
186 XGL_GPU_SIZE offset;
187 XGL_INDEX_TYPE type;
188 } index;
189
190 struct {
191 const struct intel_rt_view *rt[XGL_MAX_COLOR_ATTACHMENTS];
192 XGL_UINT rt_count;
193
194 const struct intel_ds_view *ds;
195 } att;
Chia-I Wu48c283d2014-08-25 23:13:46 +0800196
Chia-I Wu707a29e2014-08-27 12:51:47 +0800197 XGL_UINT draw_count;
Chia-I Wu48c283d2014-08-25 23:13:46 +0800198 uint32_t wa_flags;
Chia-I Wub2755562014-08-20 13:38:52 +0800199};
Chia-I Wu09142132014-08-11 15:42:55 +0800200
Chia-I Wue24c3292014-08-21 14:05:23 +0800201struct intel_cmd_writer {
202 struct intel_bo *bo;
Chia-I Wu0f50ba82014-09-09 10:25:46 +0800203 void *ptr;
Chia-I Wue24c3292014-08-21 14:05:23 +0800204
205 /* in DWords */
206 XGL_UINT size;
207 XGL_UINT used;
208};
209
Chia-I Wu730e5362014-08-19 12:15:09 +0800210struct intel_cmd {
211 struct intel_obj obj;
212
213 struct intel_dev *dev;
Chia-I Wu0b784442014-08-25 22:54:16 +0800214 struct intel_bo *scratch_bo;
Chia-I Wu63883292014-08-25 13:50:26 +0800215 int pipeline_select;
Chia-I Wu730e5362014-08-19 12:15:09 +0800216
Chia-I Wu343b1372014-08-20 16:39:20 +0800217 struct intel_cmd_reloc *relocs;
218 XGL_UINT reloc_count;
219
Chia-I Wu730e5362014-08-19 12:15:09 +0800220 XGL_FLAGS flags;
221
Chia-I Wu68f319d2014-09-09 09:43:21 +0800222 struct intel_cmd_writer writers[INTEL_CMD_WRITER_COUNT];
Chia-I Wu730e5362014-08-19 12:15:09 +0800223
Chia-I Wu343b1372014-08-20 16:39:20 +0800224 XGL_UINT reloc_used;
Chia-I Wu04966702014-08-20 15:05:03 +0800225 XGL_RESULT result;
Chia-I Wub2755562014-08-20 13:38:52 +0800226
227 struct intel_cmd_bind bind;
Chia-I Wu730e5362014-08-19 12:15:09 +0800228};
229
230static inline struct intel_cmd *intel_cmd(XGL_CMD_BUFFER cmd)
231{
232 return (struct intel_cmd *) cmd;
233}
234
235static inline struct intel_cmd *intel_cmd_from_obj(struct intel_obj *obj)
236{
237 return (struct intel_cmd *) obj;
238}
239
240XGL_RESULT intel_cmd_create(struct intel_dev *dev,
241 const XGL_CMD_BUFFER_CREATE_INFO *info,
242 struct intel_cmd **cmd_ret);
243void intel_cmd_destroy(struct intel_cmd *cmd);
244
245XGL_RESULT intel_cmd_begin(struct intel_cmd *cmd, XGL_FLAGS flags);
246XGL_RESULT intel_cmd_end(struct intel_cmd *cmd);
247
Chia-I Wue24c3292014-08-21 14:05:23 +0800248static inline struct intel_bo *intel_cmd_get_batch(const struct intel_cmd *cmd,
249 XGL_GPU_SIZE *used)
250{
Chia-I Wu68f319d2014-09-09 09:43:21 +0800251 const struct intel_cmd_writer *writer =
252 &cmd->writers[INTEL_CMD_WRITER_BATCH];
Chia-I Wue24c3292014-08-21 14:05:23 +0800253
254 if (used)
255 *used = sizeof(uint32_t) * writer->used;
256
257 return writer->bo;
258}
259
Chia-I Wu09142132014-08-11 15:42:55 +0800260XGL_RESULT XGLAPI intelCreateCommandBuffer(
261 XGL_DEVICE device,
262 const XGL_CMD_BUFFER_CREATE_INFO* pCreateInfo,
263 XGL_CMD_BUFFER* pCmdBuffer);
264
265XGL_RESULT XGLAPI intelBeginCommandBuffer(
266 XGL_CMD_BUFFER cmdBuffer,
267 XGL_FLAGS flags);
268
269XGL_RESULT XGLAPI intelEndCommandBuffer(
270 XGL_CMD_BUFFER cmdBuffer);
271
272XGL_RESULT XGLAPI intelResetCommandBuffer(
273 XGL_CMD_BUFFER cmdBuffer);
274
275XGL_VOID XGLAPI intelCmdBindPipeline(
276 XGL_CMD_BUFFER cmdBuffer,
277 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
278 XGL_PIPELINE pipeline);
279
280XGL_VOID XGLAPI intelCmdBindPipelineDelta(
281 XGL_CMD_BUFFER cmdBuffer,
282 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
283 XGL_PIPELINE_DELTA delta);
284
285XGL_VOID XGLAPI intelCmdBindStateObject(
286 XGL_CMD_BUFFER cmdBuffer,
287 XGL_STATE_BIND_POINT stateBindPoint,
288 XGL_STATE_OBJECT state);
289
290XGL_VOID XGLAPI intelCmdBindDescriptorSet(
291 XGL_CMD_BUFFER cmdBuffer,
292 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
293 XGL_UINT index,
294 XGL_DESCRIPTOR_SET descriptorSet,
295 XGL_UINT slotOffset);
296
297XGL_VOID XGLAPI intelCmdBindDynamicMemoryView(
298 XGL_CMD_BUFFER cmdBuffer,
299 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
300 const XGL_MEMORY_VIEW_ATTACH_INFO* pMemView);
301
302XGL_VOID XGLAPI intelCmdBindIndexData(
303 XGL_CMD_BUFFER cmdBuffer,
304 XGL_GPU_MEMORY mem,
305 XGL_GPU_SIZE offset,
306 XGL_INDEX_TYPE indexType);
307
308XGL_VOID XGLAPI intelCmdBindAttachments(
309 XGL_CMD_BUFFER cmdBuffer,
310 XGL_UINT colorAttachmentCount,
311 const XGL_COLOR_ATTACHMENT_BIND_INFO* pColorAttachments,
312 const XGL_DEPTH_STENCIL_BIND_INFO* pDepthStencilAttachment);
313
314XGL_VOID XGLAPI intelCmdPrepareMemoryRegions(
315 XGL_CMD_BUFFER cmdBuffer,
316 XGL_UINT transitionCount,
317 const XGL_MEMORY_STATE_TRANSITION* pStateTransitions);
318
319XGL_VOID XGLAPI intelCmdPrepareImages(
320 XGL_CMD_BUFFER cmdBuffer,
321 XGL_UINT transitionCount,
322 const XGL_IMAGE_STATE_TRANSITION* pStateTransitions);
323
324XGL_VOID XGLAPI intelCmdDraw(
325 XGL_CMD_BUFFER cmdBuffer,
326 XGL_UINT firstVertex,
327 XGL_UINT vertexCount,
328 XGL_UINT firstInstance,
329 XGL_UINT instanceCount);
330
331XGL_VOID XGLAPI intelCmdDrawIndexed(
332 XGL_CMD_BUFFER cmdBuffer,
333 XGL_UINT firstIndex,
334 XGL_UINT indexCount,
335 XGL_INT vertexOffset,
336 XGL_UINT firstInstance,
337 XGL_UINT instanceCount);
338
339XGL_VOID XGLAPI intelCmdDrawIndirect(
340 XGL_CMD_BUFFER cmdBuffer,
341 XGL_GPU_MEMORY mem,
342 XGL_GPU_SIZE offset,
343 XGL_UINT32 count,
344 XGL_UINT32 stride);
345
346XGL_VOID XGLAPI intelCmdDrawIndexedIndirect(
347 XGL_CMD_BUFFER cmdBuffer,
348 XGL_GPU_MEMORY mem,
349 XGL_GPU_SIZE offset,
350 XGL_UINT32 count,
351 XGL_UINT32 stride);
352
353XGL_VOID XGLAPI intelCmdDispatch(
354 XGL_CMD_BUFFER cmdBuffer,
355 XGL_UINT x,
356 XGL_UINT y,
357 XGL_UINT z);
358
359XGL_VOID XGLAPI intelCmdDispatchIndirect(
360 XGL_CMD_BUFFER cmdBuffer,
361 XGL_GPU_MEMORY mem,
362 XGL_GPU_SIZE offset);
363
364XGL_VOID XGLAPI intelCmdCopyMemory(
365 XGL_CMD_BUFFER cmdBuffer,
366 XGL_GPU_MEMORY srcMem,
367 XGL_GPU_MEMORY destMem,
368 XGL_UINT regionCount,
369 const XGL_MEMORY_COPY* pRegions);
370
371XGL_VOID XGLAPI intelCmdCopyImage(
372 XGL_CMD_BUFFER cmdBuffer,
373 XGL_IMAGE srcImage,
374 XGL_IMAGE destImage,
375 XGL_UINT regionCount,
376 const XGL_IMAGE_COPY* pRegions);
377
378XGL_VOID XGLAPI intelCmdCopyMemoryToImage(
379 XGL_CMD_BUFFER cmdBuffer,
380 XGL_GPU_MEMORY srcMem,
381 XGL_IMAGE destImage,
382 XGL_UINT regionCount,
383 const XGL_MEMORY_IMAGE_COPY* pRegions);
384
385XGL_VOID XGLAPI intelCmdCopyImageToMemory(
386 XGL_CMD_BUFFER cmdBuffer,
387 XGL_IMAGE srcImage,
388 XGL_GPU_MEMORY destMem,
389 XGL_UINT regionCount,
390 const XGL_MEMORY_IMAGE_COPY* pRegions);
391
392XGL_VOID XGLAPI intelCmdCloneImageData(
393 XGL_CMD_BUFFER cmdBuffer,
394 XGL_IMAGE srcImage,
395 XGL_IMAGE_STATE srcImageState,
396 XGL_IMAGE destImage,
397 XGL_IMAGE_STATE destImageState);
398
399XGL_VOID XGLAPI intelCmdUpdateMemory(
400 XGL_CMD_BUFFER cmdBuffer,
401 XGL_GPU_MEMORY destMem,
402 XGL_GPU_SIZE destOffset,
403 XGL_GPU_SIZE dataSize,
404 const XGL_UINT32* pData);
405
406XGL_VOID XGLAPI intelCmdFillMemory(
407 XGL_CMD_BUFFER cmdBuffer,
408 XGL_GPU_MEMORY destMem,
409 XGL_GPU_SIZE destOffset,
410 XGL_GPU_SIZE fillSize,
411 XGL_UINT32 data);
412
413XGL_VOID XGLAPI intelCmdClearColorImage(
414 XGL_CMD_BUFFER cmdBuffer,
415 XGL_IMAGE image,
416 const XGL_FLOAT color[4],
417 XGL_UINT rangeCount,
418 const XGL_IMAGE_SUBRESOURCE_RANGE* pRanges);
419
420XGL_VOID XGLAPI intelCmdClearColorImageRaw(
421 XGL_CMD_BUFFER cmdBuffer,
422 XGL_IMAGE image,
423 const XGL_UINT32 color[4],
424 XGL_UINT rangeCount,
425 const XGL_IMAGE_SUBRESOURCE_RANGE* pRanges);
426
427XGL_VOID XGLAPI intelCmdClearDepthStencil(
428 XGL_CMD_BUFFER cmdBuffer,
429 XGL_IMAGE image,
430 XGL_FLOAT depth,
431 XGL_UINT32 stencil,
432 XGL_UINT rangeCount,
433 const XGL_IMAGE_SUBRESOURCE_RANGE* pRanges);
434
435XGL_VOID XGLAPI intelCmdResolveImage(
436 XGL_CMD_BUFFER cmdBuffer,
437 XGL_IMAGE srcImage,
438 XGL_IMAGE destImage,
439 XGL_UINT rectCount,
440 const XGL_IMAGE_RESOLVE* pRects);
441
442XGL_VOID XGLAPI intelCmdSetEvent(
443 XGL_CMD_BUFFER cmdBuffer,
444 XGL_EVENT event);
445
446XGL_VOID XGLAPI intelCmdResetEvent(
447 XGL_CMD_BUFFER cmdBuffer,
448 XGL_EVENT event);
449
450XGL_VOID XGLAPI intelCmdMemoryAtomic(
451 XGL_CMD_BUFFER cmdBuffer,
452 XGL_GPU_MEMORY destMem,
453 XGL_GPU_SIZE destOffset,
454 XGL_UINT64 srcData,
455 XGL_ATOMIC_OP atomicOp);
456
457XGL_VOID XGLAPI intelCmdBeginQuery(
458 XGL_CMD_BUFFER cmdBuffer,
459 XGL_QUERY_POOL queryPool,
460 XGL_UINT slot,
461 XGL_FLAGS flags);
462
463XGL_VOID XGLAPI intelCmdEndQuery(
464 XGL_CMD_BUFFER cmdBuffer,
465 XGL_QUERY_POOL queryPool,
466 XGL_UINT slot);
467
468XGL_VOID XGLAPI intelCmdResetQueryPool(
469 XGL_CMD_BUFFER cmdBuffer,
470 XGL_QUERY_POOL queryPool,
471 XGL_UINT startQuery,
472 XGL_UINT queryCount);
473
474XGL_VOID XGLAPI intelCmdWriteTimestamp(
475 XGL_CMD_BUFFER cmdBuffer,
476 XGL_TIMESTAMP_TYPE timestampType,
477 XGL_GPU_MEMORY destMem,
478 XGL_GPU_SIZE destOffset);
479
480XGL_VOID XGLAPI intelCmdInitAtomicCounters(
481 XGL_CMD_BUFFER cmdBuffer,
482 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
483 XGL_UINT startCounter,
484 XGL_UINT counterCount,
485 const XGL_UINT32* pData);
486
487XGL_VOID XGLAPI intelCmdLoadAtomicCounters(
488 XGL_CMD_BUFFER cmdBuffer,
489 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
490 XGL_UINT startCounter,
491 XGL_UINT counterCount,
492 XGL_GPU_MEMORY srcMem,
493 XGL_GPU_SIZE srcOffset);
494
495XGL_VOID XGLAPI intelCmdSaveAtomicCounters(
496 XGL_CMD_BUFFER cmdBuffer,
497 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
498 XGL_UINT startCounter,
499 XGL_UINT counterCount,
500 XGL_GPU_MEMORY destMem,
501 XGL_GPU_SIZE destOffset);
502
503XGL_VOID XGLAPI intelCmdDbgMarkerBegin(
504 XGL_CMD_BUFFER cmdBuffer,
505 const XGL_CHAR* pMarker);
506
507XGL_VOID XGLAPI intelCmdDbgMarkerEnd(
508 XGL_CMD_BUFFER cmdBuffer);
509
510#endif /* CMD_H */