blob: dcb604843fe9ac9650613f0a3d0fc599843e3967 [file] [log] [blame]
Chia-I Wub2755562014-08-20 13:38:52 +08001/*
2 * XGL
3 *
4 * Copyright (C) 2014 LunarG, Inc.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
23 */
24
Chia-I Wu9f039862014-08-20 15:39:56 +080025#include "genhw/genhw.h"
Chia-I Wub2755562014-08-20 13:38:52 +080026#include "dset.h"
Chia-I Wu7fae4e32014-08-21 11:39:44 +080027#include "img.h"
Chia-I Wub2755562014-08-20 13:38:52 +080028#include "mem.h"
Chia-I Wu018a3962014-08-21 10:37:52 +080029#include "pipeline.h"
Chia-I Wub2755562014-08-20 13:38:52 +080030#include "state.h"
31#include "view.h"
32#include "cmd_priv.h"
33
Chia-I Wu48c283d2014-08-25 23:13:46 +080034enum {
35 GEN6_WA_POST_SYNC_FLUSH = 1 << 0,
36 GEN6_WA_DS_FLUSH = 1 << 1,
37};
38
Chia-I Wu59c097e2014-08-21 10:51:07 +080039static void gen6_3DPRIMITIVE(struct intel_cmd *cmd,
Chia-I Wu254db422014-08-21 11:54:29 +080040 int prim_type, bool indexed,
Chia-I Wu59c097e2014-08-21 10:51:07 +080041 uint32_t vertex_count,
42 uint32_t vertex_start,
43 uint32_t instance_count,
44 uint32_t instance_start,
45 uint32_t vertex_base)
46{
47 const uint8_t cmd_len = 6;
48 uint32_t dw0;
49
50 CMD_ASSERT(cmd, 6, 6);
51
Chia-I Wu426072d2014-08-26 14:31:55 +080052 dw0 = GEN6_RENDER_CMD(3D, 3DPRIMITIVE) |
Chia-I Wu254db422014-08-21 11:54:29 +080053 prim_type << GEN6_3DPRIM_DW0_TYPE__SHIFT |
Chia-I Wu59c097e2014-08-21 10:51:07 +080054 (cmd_len - 2);
55
56 if (indexed)
57 dw0 |= GEN6_3DPRIM_DW0_ACCESS_RANDOM;
58
Chia-I Wue24c3292014-08-21 14:05:23 +080059 cmd_batch_reserve(cmd, cmd_len);
60 cmd_batch_write(cmd, dw0);
61 cmd_batch_write(cmd, vertex_count);
62 cmd_batch_write(cmd, vertex_start);
63 cmd_batch_write(cmd, instance_count);
64 cmd_batch_write(cmd, instance_start);
65 cmd_batch_write(cmd, vertex_base);
Chia-I Wu59c097e2014-08-21 10:51:07 +080066}
67
68static void gen7_3DPRIMITIVE(struct intel_cmd *cmd,
Chia-I Wu254db422014-08-21 11:54:29 +080069 int prim_type, bool indexed,
Chia-I Wu59c097e2014-08-21 10:51:07 +080070 uint32_t vertex_count,
71 uint32_t vertex_start,
72 uint32_t instance_count,
73 uint32_t instance_start,
74 uint32_t vertex_base)
75{
76 const uint8_t cmd_len = 7;
77 uint32_t dw0, dw1;
78
79 CMD_ASSERT(cmd, 7, 7.5);
80
Chia-I Wu426072d2014-08-26 14:31:55 +080081 dw0 = GEN6_RENDER_CMD(3D, 3DPRIMITIVE) | (cmd_len - 2);
Chia-I Wu254db422014-08-21 11:54:29 +080082 dw1 = prim_type << GEN7_3DPRIM_DW1_TYPE__SHIFT;
Chia-I Wu59c097e2014-08-21 10:51:07 +080083
84 if (indexed)
85 dw1 |= GEN7_3DPRIM_DW1_ACCESS_RANDOM;
86
Chia-I Wue24c3292014-08-21 14:05:23 +080087 cmd_batch_reserve(cmd, cmd_len);
88 cmd_batch_write(cmd, dw0);
89 cmd_batch_write(cmd, dw1);
90 cmd_batch_write(cmd, vertex_count);
91 cmd_batch_write(cmd, vertex_start);
92 cmd_batch_write(cmd, instance_count);
93 cmd_batch_write(cmd, instance_start);
94 cmd_batch_write(cmd, vertex_base);
Chia-I Wu59c097e2014-08-21 10:51:07 +080095}
96
Chia-I Wu270b1e82014-08-25 15:53:39 +080097static void gen6_PIPE_CONTROL(struct intel_cmd *cmd, uint32_t dw1,
98 struct intel_bo *bo, uint32_t bo_offset)
99{
100 const uint8_t cmd_len = 5;
Chia-I Wu426072d2014-08-26 14:31:55 +0800101 const uint32_t dw0 = GEN6_RENDER_CMD(3D, PIPE_CONTROL) |
Chia-I Wu270b1e82014-08-25 15:53:39 +0800102 (cmd_len - 2);
Chia-I Wu270b1e82014-08-25 15:53:39 +0800103
104 CMD_ASSERT(cmd, 6, 7.5);
105
106 assert(bo_offset % 8 == 0);
107
108 if (dw1 & GEN6_PIPE_CONTROL_CS_STALL) {
109 /*
110 * From the Sandy Bridge PRM, volume 2 part 1, page 73:
111 *
112 * "1 of the following must also be set (when CS stall is set):
113 *
114 * * Depth Cache Flush Enable ([0] of DW1)
115 * * Stall at Pixel Scoreboard ([1] of DW1)
116 * * Depth Stall ([13] of DW1)
117 * * Post-Sync Operation ([13] of DW1)
118 * * Render Target Cache Flush Enable ([12] of DW1)
119 * * Notify Enable ([8] of DW1)"
120 *
121 * From the Ivy Bridge PRM, volume 2 part 1, page 61:
122 *
123 * "One of the following must also be set (when CS stall is set):
124 *
125 * * Render Target Cache Flush Enable ([12] of DW1)
126 * * Depth Cache Flush Enable ([0] of DW1)
127 * * Stall at Pixel Scoreboard ([1] of DW1)
128 * * Depth Stall ([13] of DW1)
129 * * Post-Sync Operation ([13] of DW1)"
130 */
131 uint32_t bit_test = GEN6_PIPE_CONTROL_RENDER_CACHE_FLUSH |
132 GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH |
133 GEN6_PIPE_CONTROL_PIXEL_SCOREBOARD_STALL |
134 GEN6_PIPE_CONTROL_DEPTH_STALL;
135
136 /* post-sync op */
137 bit_test |= GEN6_PIPE_CONTROL_WRITE_IMM |
138 GEN6_PIPE_CONTROL_WRITE_PS_DEPTH_COUNT |
139 GEN6_PIPE_CONTROL_WRITE_TIMESTAMP;
140
141 if (cmd_gen(cmd) == INTEL_GEN(6))
142 bit_test |= GEN6_PIPE_CONTROL_NOTIFY_ENABLE;
143
144 assert(dw1 & bit_test);
145 }
146
147 if (dw1 & GEN6_PIPE_CONTROL_DEPTH_STALL) {
148 /*
149 * From the Sandy Bridge PRM, volume 2 part 1, page 73:
150 *
151 * "Following bits must be clear (when Depth Stall is set):
152 *
153 * * Render Target Cache Flush Enable ([12] of DW1)
154 * * Depth Cache Flush Enable ([0] of DW1)"
155 */
156 assert(!(dw1 & (GEN6_PIPE_CONTROL_RENDER_CACHE_FLUSH |
157 GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH)));
158 }
159
160 /*
161 * From the Sandy Bridge PRM, volume 1 part 3, page 19:
162 *
163 * "[DevSNB] PPGTT memory writes by MI_* (such as MI_STORE_DATA_IMM)
164 * and PIPE_CONTROL are not supported."
165 *
166 * The kernel will add the mapping automatically (when write domain is
167 * INTEL_DOMAIN_INSTRUCTION).
168 */
169 if (cmd_gen(cmd) == INTEL_GEN(6) && bo)
170 bo_offset |= GEN6_PIPE_CONTROL_DW2_USE_GGTT;
171
172 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) bo);
173 cmd_batch_write(cmd, dw0);
174 cmd_batch_write(cmd, dw1);
Chia-I Wu32a22462014-08-26 14:13:46 +0800175 if (bo) {
176 cmd_batch_reloc(cmd, bo_offset, bo, INTEL_RELOC_GGTT |
177 INTEL_RELOC_WRITE);
178 } else {
Chia-I Wu270b1e82014-08-25 15:53:39 +0800179 cmd_batch_write(cmd, 0);
Chia-I Wu32a22462014-08-26 14:13:46 +0800180 }
Chia-I Wu270b1e82014-08-25 15:53:39 +0800181 cmd_batch_write(cmd, 0);
182 cmd_batch_write(cmd, 0);
183}
184
Chia-I Wu254db422014-08-21 11:54:29 +0800185static bool gen6_can_primitive_restart(const struct intel_cmd *cmd)
186{
187 const struct intel_pipeline *p = cmd->bind.pipeline.graphics;
188 bool supported;
189
190 CMD_ASSERT(cmd, 6, 7.5);
191
192 if (cmd_gen(cmd) >= INTEL_GEN(7.5))
193 return (p->prim_type != GEN6_3DPRIM_RECTLIST);
194
195 switch (p->prim_type) {
196 case GEN6_3DPRIM_POINTLIST:
197 case GEN6_3DPRIM_LINELIST:
198 case GEN6_3DPRIM_LINESTRIP:
199 case GEN6_3DPRIM_TRILIST:
200 case GEN6_3DPRIM_TRISTRIP:
201 supported = true;
202 break;
203 default:
204 supported = false;
205 break;
206 }
207
208 if (!supported)
209 return false;
210
211 switch (cmd->bind.index.type) {
212 case XGL_INDEX_8:
213 supported = (p->primitive_restart_index != 0xffu);
214 break;
215 case XGL_INDEX_16:
216 supported = (p->primitive_restart_index != 0xffffu);
217 break;
218 case XGL_INDEX_32:
219 supported = (p->primitive_restart_index != 0xffffffffu);
220 break;
221 default:
222 supported = false;
223 break;
224 }
225
226 return supported;
227}
228
Chia-I Wu59c097e2014-08-21 10:51:07 +0800229static void gen6_3DSTATE_INDEX_BUFFER(struct intel_cmd *cmd,
Chia-I Wu958d1b72014-08-21 11:28:11 +0800230 const struct intel_mem *mem,
Chia-I Wu59c097e2014-08-21 10:51:07 +0800231 XGL_GPU_SIZE offset,
232 XGL_INDEX_TYPE type,
233 bool enable_cut_index)
234{
235 const uint8_t cmd_len = 3;
236 uint32_t dw0, end_offset;
237 unsigned offset_align;
238
239 CMD_ASSERT(cmd, 6, 7.5);
240
Chia-I Wu426072d2014-08-26 14:31:55 +0800241 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_INDEX_BUFFER) | (cmd_len - 2);
Chia-I Wu59c097e2014-08-21 10:51:07 +0800242
243 /* the bit is moved to 3DSTATE_VF */
244 if (cmd_gen(cmd) >= INTEL_GEN(7.5))
245 assert(!enable_cut_index);
246 if (enable_cut_index)
247 dw0 |= GEN6_IB_DW0_CUT_INDEX_ENABLE;
248
249 switch (type) {
250 case XGL_INDEX_8:
251 dw0 |= GEN6_IB_DW0_FORMAT_BYTE;
252 offset_align = 1;
253 break;
254 case XGL_INDEX_16:
255 dw0 |= GEN6_IB_DW0_FORMAT_WORD;
256 offset_align = 2;
257 break;
258 case XGL_INDEX_32:
259 dw0 |= GEN6_IB_DW0_FORMAT_DWORD;
260 offset_align = 4;
261 break;
262 default:
263 cmd->result = XGL_ERROR_INVALID_VALUE;
264 return;
265 break;
266 }
267
268 if (offset % offset_align) {
269 cmd->result = XGL_ERROR_INVALID_VALUE;
270 return;
271 }
272
273 /* aligned and inclusive */
274 end_offset = mem->size - (mem->size % offset_align) - 1;
275
Chia-I Wu2de65d02014-08-25 10:02:53 +0800276 cmd_batch_reserve_reloc(cmd, cmd_len, 2);
Chia-I Wue24c3292014-08-21 14:05:23 +0800277 cmd_batch_write(cmd, dw0);
Chia-I Wu32a22462014-08-26 14:13:46 +0800278 cmd_batch_reloc(cmd, offset, mem->bo, 0);
279 cmd_batch_reloc(cmd, end_offset, mem->bo, 0);
Chia-I Wu59c097e2014-08-21 10:51:07 +0800280}
281
Chia-I Wu254db422014-08-21 11:54:29 +0800282static inline void
283gen75_3DSTATE_VF(struct intel_cmd *cmd,
284 bool enable_cut_index,
285 uint32_t cut_index)
286{
287 const uint8_t cmd_len = 2;
288 uint32_t dw0;
289
290 CMD_ASSERT(cmd, 7.5, 7.5);
291
Chia-I Wu426072d2014-08-26 14:31:55 +0800292 dw0 = GEN75_RENDER_CMD(3D, 3DSTATE_VF) | (cmd_len - 2);
Chia-I Wu254db422014-08-21 11:54:29 +0800293 if (enable_cut_index)
294 dw0 |= GEN75_VF_DW0_CUT_INDEX_ENABLE;
295
Chia-I Wue24c3292014-08-21 14:05:23 +0800296 cmd_batch_reserve(cmd, cmd_len);
297 cmd_batch_write(cmd, dw0);
298 cmd_batch_write(cmd, cut_index);
Chia-I Wu254db422014-08-21 11:54:29 +0800299}
300
Chia-I Wud88e02d2014-08-25 10:56:13 +0800301static void gen6_3DSTATE_DRAWING_RECTANGLE(struct intel_cmd *cmd,
302 XGL_UINT width, XGL_UINT height)
303{
304 const uint8_t cmd_len = 4;
Chia-I Wu426072d2014-08-26 14:31:55 +0800305 const uint32_t dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_DRAWING_RECTANGLE) |
Chia-I Wud88e02d2014-08-25 10:56:13 +0800306 (cmd_len - 2);
307
308 CMD_ASSERT(cmd, 6, 7.5);
309
310 cmd_batch_reserve(cmd, cmd_len);
311 cmd_batch_write(cmd, dw0);
312 if (width && height) {
313 cmd_batch_write(cmd, 0);
314 cmd_batch_write(cmd, (height - 1) << 16 |
315 (width - 1));
316 } else {
317 cmd_batch_write(cmd, 1);
318 cmd_batch_write(cmd, 0);
319 }
320 cmd_batch_write(cmd, 0);
321}
322
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800323static void gen6_3DSTATE_DEPTH_BUFFER(struct intel_cmd *cmd,
324 const struct intel_ds_view *view)
325{
326 const uint8_t cmd_len = 7;
327 uint32_t dw0;
328
329 CMD_ASSERT(cmd, 6, 7.5);
330
331 dw0 = (cmd_gen(cmd) >= INTEL_GEN(7)) ?
Chia-I Wu426072d2014-08-26 14:31:55 +0800332 GEN7_RENDER_CMD(3D, 3DSTATE_DEPTH_BUFFER) :
333 GEN6_RENDER_CMD(3D, 3DSTATE_DEPTH_BUFFER);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800334 dw0 |= (cmd_len - 2);
335
Chia-I Wu2de65d02014-08-25 10:02:53 +0800336 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) view->img);
Chia-I Wue24c3292014-08-21 14:05:23 +0800337 cmd_batch_write(cmd, dw0);
338 cmd_batch_write(cmd, view->cmd[0]);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600339 if (view->img) {
Chia-I Wu9ee38722014-08-25 12:11:36 +0800340 cmd_batch_reloc(cmd, view->cmd[1], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800341 INTEL_RELOC_WRITE);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600342 } else {
343 cmd_batch_write(cmd, 0);
344 }
Chia-I Wue24c3292014-08-21 14:05:23 +0800345 cmd_batch_write(cmd, view->cmd[2]);
346 cmd_batch_write(cmd, view->cmd[3]);
347 cmd_batch_write(cmd, view->cmd[4]);
348 cmd_batch_write(cmd, view->cmd[5]);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800349}
350
351static void gen6_3DSTATE_STENCIL_BUFFER(struct intel_cmd *cmd,
352 const struct intel_ds_view *view)
353{
354 const uint8_t cmd_len = 3;
355 uint32_t dw0;
356
357 CMD_ASSERT(cmd, 6, 7.5);
358
359 dw0 = (cmd_gen(cmd) >= INTEL_GEN(7)) ?
Chia-I Wu426072d2014-08-26 14:31:55 +0800360 GEN7_RENDER_CMD(3D, 3DSTATE_STENCIL_BUFFER) :
361 GEN6_RENDER_CMD(3D, 3DSTATE_STENCIL_BUFFER);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800362 dw0 |= (cmd_len - 2);
363
Chia-I Wu2de65d02014-08-25 10:02:53 +0800364 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) view->img);
Chia-I Wue24c3292014-08-21 14:05:23 +0800365 cmd_batch_write(cmd, dw0);
366 cmd_batch_write(cmd, view->cmd[6]);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600367 if (view->img) {
Chia-I Wu9ee38722014-08-25 12:11:36 +0800368 cmd_batch_reloc(cmd, view->cmd[7], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800369 INTEL_RELOC_WRITE);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600370 } else {
371 cmd_batch_write(cmd, 0);
372 }
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800373}
374
375static void gen6_3DSTATE_HIER_DEPTH_BUFFER(struct intel_cmd *cmd,
376 const struct intel_ds_view *view)
377{
378 const uint8_t cmd_len = 3;
379 uint32_t dw0;
380
381 CMD_ASSERT(cmd, 6, 7.5);
382
383 dw0 = (cmd_gen(cmd) >= INTEL_GEN(7)) ?
Chia-I Wu426072d2014-08-26 14:31:55 +0800384 GEN7_RENDER_CMD(3D, 3DSTATE_HIER_DEPTH_BUFFER) :
385 GEN6_RENDER_CMD(3D, 3DSTATE_HIER_DEPTH_BUFFER);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800386 dw0 |= (cmd_len - 2);
387
Chia-I Wu2de65d02014-08-25 10:02:53 +0800388 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) view->img);
Chia-I Wue24c3292014-08-21 14:05:23 +0800389 cmd_batch_write(cmd, dw0);
390 cmd_batch_write(cmd, view->cmd[8]);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600391 if (view->img) {
Chia-I Wu9ee38722014-08-25 12:11:36 +0800392 cmd_batch_reloc(cmd, view->cmd[9], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800393 INTEL_RELOC_WRITE);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600394 } else {
395 cmd_batch_write(cmd, 0);
396 }
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800397}
398
Chia-I Wuf8231032014-08-25 10:44:45 +0800399static void gen6_3DSTATE_CLEAR_PARAMS(struct intel_cmd *cmd,
400 uint32_t clear_val)
401{
402 const uint8_t cmd_len = 2;
Chia-I Wu426072d2014-08-26 14:31:55 +0800403 const uint32_t dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_CLEAR_PARAMS) |
Chia-I Wuf8231032014-08-25 10:44:45 +0800404 GEN6_CLEAR_PARAMS_DW0_VALID |
405 (cmd_len - 2);
406
407 CMD_ASSERT(cmd, 6, 6);
408
409 cmd_batch_reserve(cmd, cmd_len);
410 cmd_batch_write(cmd, dw0);
411 cmd_batch_write(cmd, clear_val);
412}
413
414static void gen7_3DSTATE_CLEAR_PARAMS(struct intel_cmd *cmd,
415 uint32_t clear_val)
416{
417 const uint8_t cmd_len = 3;
Chia-I Wu426072d2014-08-26 14:31:55 +0800418 const uint32_t dw0 = GEN7_RENDER_CMD(3D, 3DSTATE_CLEAR_PARAMS) |
Chia-I Wuf8231032014-08-25 10:44:45 +0800419 (cmd_len - 2);
420
421 CMD_ASSERT(cmd, 7, 7.5);
422
423 cmd_batch_reserve(cmd, cmd_len);
424 cmd_batch_write(cmd, dw0);
425 cmd_batch_write(cmd, clear_val);
426 cmd_batch_write(cmd, 1);
427}
428
Chia-I Wu302742d2014-08-22 10:28:29 +0800429static void gen6_3DSTATE_CC_STATE_POINTERS(struct intel_cmd *cmd,
430 XGL_UINT blend_pos,
431 XGL_UINT ds_pos,
432 XGL_UINT cc_pos)
433{
434 const uint8_t cmd_len = 4;
435 uint32_t dw0;
436
437 CMD_ASSERT(cmd, 6, 6);
438
Chia-I Wu426072d2014-08-26 14:31:55 +0800439 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_CC_STATE_POINTERS) |
Chia-I Wu302742d2014-08-22 10:28:29 +0800440 (cmd_len - 2);
441
442 cmd_batch_reserve(cmd, cmd_len);
443 cmd_batch_write(cmd, dw0);
444 cmd_batch_write(cmd, (blend_pos << 2) | 1);
445 cmd_batch_write(cmd, (ds_pos << 2) | 1);
446 cmd_batch_write(cmd, (cc_pos << 2) | 1);
447}
448
Chia-I Wu1744cca2014-08-22 11:10:17 +0800449static void gen6_3DSTATE_VIEWPORT_STATE_POINTERS(struct intel_cmd *cmd,
450 XGL_UINT clip_pos,
451 XGL_UINT sf_pos,
452 XGL_UINT cc_pos)
453{
454 const uint8_t cmd_len = 4;
455 uint32_t dw0;
456
457 CMD_ASSERT(cmd, 6, 6);
458
Chia-I Wu426072d2014-08-26 14:31:55 +0800459 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_VIEWPORT_STATE_POINTERS) |
Chia-I Wu1744cca2014-08-22 11:10:17 +0800460 GEN6_PTR_VP_DW0_CLIP_CHANGED |
461 GEN6_PTR_VP_DW0_SF_CHANGED |
462 GEN6_PTR_VP_DW0_CC_CHANGED |
463 (cmd_len - 2);
464
465 cmd_batch_reserve(cmd, cmd_len);
466 cmd_batch_write(cmd, dw0);
467 cmd_batch_write(cmd, clip_pos << 2);
468 cmd_batch_write(cmd, sf_pos << 2);
469 cmd_batch_write(cmd, cc_pos << 2);
470}
471
472static void gen6_3DSTATE_SCISSOR_STATE_POINTERS(struct intel_cmd *cmd,
473 XGL_UINT scissor_pos)
474{
475 const uint8_t cmd_len = 2;
476 uint32_t dw0;
477
478 CMD_ASSERT(cmd, 6, 6);
479
Chia-I Wu426072d2014-08-26 14:31:55 +0800480 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_SCISSOR_STATE_POINTERS) |
Chia-I Wu1744cca2014-08-22 11:10:17 +0800481 (cmd_len - 2);
482
483 cmd_batch_reserve(cmd, cmd_len);
484 cmd_batch_write(cmd, dw0);
485 cmd_batch_write(cmd, scissor_pos << 2);
486}
487
Chia-I Wu42a56202014-08-23 16:47:48 +0800488static void gen6_3DSTATE_BINDING_TABLE_POINTERS(struct intel_cmd *cmd,
489 XGL_UINT vs_pos,
490 XGL_UINT gs_pos,
491 XGL_UINT ps_pos)
492{
493 const uint8_t cmd_len = 4;
494 uint32_t dw0;
495
496 CMD_ASSERT(cmd, 6, 6);
497
Chia-I Wu426072d2014-08-26 14:31:55 +0800498 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_BINDING_TABLE_POINTERS) |
Chia-I Wu42a56202014-08-23 16:47:48 +0800499 GEN6_PTR_BINDING_TABLE_DW0_VS_CHANGED |
500 GEN6_PTR_BINDING_TABLE_DW0_GS_CHANGED |
501 GEN6_PTR_BINDING_TABLE_DW0_PS_CHANGED |
502 (cmd_len - 2);
503
504 cmd_batch_reserve(cmd, cmd_len);
505 cmd_batch_write(cmd, dw0);
506 cmd_batch_write(cmd, vs_pos << 2);
507 cmd_batch_write(cmd, gs_pos << 2);
508 cmd_batch_write(cmd, ps_pos << 2);
509}
510
Chia-I Wu302742d2014-08-22 10:28:29 +0800511static void gen7_3dstate_pointer(struct intel_cmd *cmd,
512 int subop, XGL_UINT pos)
513{
514 const uint8_t cmd_len = 2;
515 const uint32_t dw0 = GEN6_RENDER_TYPE_RENDER |
516 GEN6_RENDER_SUBTYPE_3D |
517 subop | (cmd_len - 2);
518
519 cmd_batch_reserve(cmd, cmd_len);
520 cmd_batch_write(cmd, dw0);
521 cmd_batch_write(cmd, pos << 2);
522}
523
524static XGL_UINT gen6_BLEND_STATE(struct intel_cmd *cmd,
525 const struct intel_blend_state *state)
526{
527 const uint8_t cmd_align = GEN6_ALIGNMENT_BLEND_STATE;
528 const uint8_t cmd_len = XGL_MAX_COLOR_ATTACHMENTS * 2;
529
530 CMD_ASSERT(cmd, 6, 7.5);
531 STATIC_ASSERT(ARRAY_SIZE(state->cmd) >= cmd_len);
532
533 return cmd_state_copy(cmd, state->cmd, cmd_len, cmd_align);
534}
535
536static XGL_UINT gen6_DEPTH_STENCIL_STATE(struct intel_cmd *cmd,
537 const struct intel_ds_state *state)
538{
539 const uint8_t cmd_align = GEN6_ALIGNMENT_DEPTH_STENCIL_STATE;
540 const uint8_t cmd_len = 3;
541
542 CMD_ASSERT(cmd, 6, 7.5);
543 STATIC_ASSERT(ARRAY_SIZE(state->cmd) >= cmd_len);
544
545 return cmd_state_copy(cmd, state->cmd, cmd_len, cmd_align);
546}
547
548static XGL_UINT gen6_COLOR_CALC_STATE(struct intel_cmd *cmd,
549 uint32_t stencil_ref,
550 const uint32_t blend_color[4])
551{
552 const uint8_t cmd_align = GEN6_ALIGNMENT_COLOR_CALC_STATE;
553 const uint8_t cmd_len = 6;
554 XGL_UINT pos;
555 uint32_t *dw;
556
557 CMD_ASSERT(cmd, 6, 7.5);
558
559 dw = cmd_state_reserve(cmd, cmd_len, cmd_align, &pos);
560 dw[0] = stencil_ref;
561 dw[1] = 0;
562 dw[2] = blend_color[0];
563 dw[3] = blend_color[1];
564 dw[4] = blend_color[2];
565 dw[5] = blend_color[3];
566 cmd_state_advance(cmd, cmd_len);
567
568 return pos;
569}
570
Chia-I Wu48c283d2014-08-25 23:13:46 +0800571static void gen6_wa_post_sync_flush(struct intel_cmd *cmd)
572{
Chia-I Wu707a29e2014-08-27 12:51:47 +0800573 if (!cmd->bind.draw_count)
574 return;
575
Chia-I Wu48c283d2014-08-25 23:13:46 +0800576 if (cmd->bind.wa_flags & GEN6_WA_POST_SYNC_FLUSH)
577 return;
578
579 CMD_ASSERT(cmd, 6, 7.5);
580
581 cmd->bind.wa_flags |= GEN6_WA_POST_SYNC_FLUSH;
582
583 /*
584 * From the Sandy Bridge PRM, volume 2 part 1, page 60:
585 *
586 * "Pipe-control with CS-stall bit set must be sent BEFORE the
587 * pipe-control with a post-sync op and no write-cache flushes."
588 *
589 * The workaround below necessitates this workaround.
590 */
591 gen6_PIPE_CONTROL(cmd,
592 GEN6_PIPE_CONTROL_CS_STALL |
593 GEN6_PIPE_CONTROL_PIXEL_SCOREBOARD_STALL,
594 NULL, 0);
595
596 /*
597 * From the Sandy Bridge PRM, volume 2 part 1, page 60:
598 *
599 * "Before any depth stall flush (including those produced by
600 * non-pipelined state commands), software needs to first send a
601 * PIPE_CONTROL with no bits set except Post-Sync Operation != 0."
602 *
603 * "Before a PIPE_CONTROL with Write Cache Flush Enable =1, a
604 * PIPE_CONTROL with any non-zero post-sync-op is required."
605 */
606 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_WRITE_IMM, cmd->scratch_bo, 0);
607}
608
609static void gen6_wa_ds_flush(struct intel_cmd *cmd)
610{
Chia-I Wu707a29e2014-08-27 12:51:47 +0800611 if (!cmd->bind.draw_count)
612 return;
613
Chia-I Wu48c283d2014-08-25 23:13:46 +0800614 if (cmd->bind.wa_flags & GEN6_WA_DS_FLUSH)
615 return;
616
617 CMD_ASSERT(cmd, 6, 7.5);
618
619 cmd->bind.wa_flags |= GEN6_WA_DS_FLUSH;
620
621 gen6_wa_post_sync_flush(cmd);
622
623 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_DEPTH_STALL, NULL, 0);
624 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH, NULL, 0);
625 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_DEPTH_STALL, NULL, 0);
626}
627
Chia-I Wu525c6602014-08-27 10:22:34 +0800628void cmd_batch_flush(struct intel_cmd *cmd, uint32_t pipe_control_dw0)
629{
630 if (!cmd->bind.draw_count)
631 return;
632
633 assert(!(pipe_control_dw0 & GEN6_PIPE_CONTROL_WRITE__MASK));
634
635 if (pipe_control_dw0 & GEN6_PIPE_CONTROL_RENDER_CACHE_FLUSH)
636 gen6_wa_post_sync_flush(cmd);
637
638 gen6_PIPE_CONTROL(cmd, pipe_control_dw0, NULL, 0);
639}
640
Chia-I Wu302742d2014-08-22 10:28:29 +0800641static void gen6_cc_states(struct intel_cmd *cmd)
642{
643 const struct intel_blend_state *blend = cmd->bind.state.blend;
644 const struct intel_ds_state *ds = cmd->bind.state.ds;
645 XGL_UINT blend_pos, ds_pos, cc_pos;
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800646 uint32_t stencil_ref;
647 uint32_t blend_color[4];
Chia-I Wu302742d2014-08-22 10:28:29 +0800648
649 CMD_ASSERT(cmd, 6, 6);
650
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800651 if (blend) {
652 blend_pos = gen6_BLEND_STATE(cmd, blend);
653 memcpy(blend_color, blend->cmd_blend_color, sizeof(blend_color));
654 } else {
655 blend_pos = 0;
656 memset(blend_color, 0, sizeof(blend_color));
657 }
658
659 if (ds) {
660 ds_pos = gen6_DEPTH_STENCIL_STATE(cmd, ds);
661 stencil_ref = ds->cmd_stencil_ref;
662 } else {
663 ds_pos = 0;
664 stencil_ref = 0;
665 }
666
667 cc_pos = gen6_COLOR_CALC_STATE(cmd, stencil_ref, blend_color);
Chia-I Wu302742d2014-08-22 10:28:29 +0800668
669 gen6_3DSTATE_CC_STATE_POINTERS(cmd, blend_pos, ds_pos, cc_pos);
670}
671
Chia-I Wu1744cca2014-08-22 11:10:17 +0800672static void gen6_viewport_states(struct intel_cmd *cmd)
673{
674 const struct intel_viewport_state *viewport = cmd->bind.state.viewport;
675 XGL_UINT pos;
676
677 if (!viewport)
678 return;
679
680 pos = cmd_state_copy(cmd, viewport->cmd, viewport->cmd_len,
681 viewport->cmd_align);
682
683 gen6_3DSTATE_VIEWPORT_STATE_POINTERS(cmd,
684 pos + viewport->cmd_clip_offset,
685 pos,
686 pos + viewport->cmd_cc_offset);
687
688 pos = (viewport->scissor_enable) ?
689 pos + viewport->cmd_scissor_rect_offset : 0;
690
691 gen6_3DSTATE_SCISSOR_STATE_POINTERS(cmd, pos);
692}
693
Chia-I Wu302742d2014-08-22 10:28:29 +0800694static void gen7_cc_states(struct intel_cmd *cmd)
695{
696 const struct intel_blend_state *blend = cmd->bind.state.blend;
697 const struct intel_ds_state *ds = cmd->bind.state.ds;
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800698 uint32_t stencil_ref;
699 uint32_t blend_color[4];
Chia-I Wu302742d2014-08-22 10:28:29 +0800700 XGL_UINT pos;
701
702 CMD_ASSERT(cmd, 7, 7.5);
703
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800704 if (!blend && !ds)
705 return;
Chia-I Wu302742d2014-08-22 10:28:29 +0800706
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800707 if (blend) {
708 pos = gen6_BLEND_STATE(cmd, blend);
709 gen7_3dstate_pointer(cmd,
710 GEN7_RENDER_OPCODE_3DSTATE_BLEND_STATE_POINTERS, pos);
Chia-I Wu302742d2014-08-22 10:28:29 +0800711
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800712 memcpy(blend_color, blend->cmd_blend_color, sizeof(blend_color));
713 } else {
714 memset(blend_color, 0, sizeof(blend_color));
715 }
716
717 if (ds) {
718 pos = gen6_DEPTH_STENCIL_STATE(cmd, ds);
719 gen7_3dstate_pointer(cmd,
720 GEN7_RENDER_OPCODE_3DSTATE_DEPTH_STENCIL_STATE_POINTERS, pos);
721 } else {
722 stencil_ref = 0;
723 }
724
725 pos = gen6_COLOR_CALC_STATE(cmd, stencil_ref, blend_color);
Chia-I Wu302742d2014-08-22 10:28:29 +0800726 gen7_3dstate_pointer(cmd,
727 GEN6_RENDER_OPCODE_3DSTATE_CC_STATE_POINTERS, pos);
728}
729
Chia-I Wu1744cca2014-08-22 11:10:17 +0800730static void gen7_viewport_states(struct intel_cmd *cmd)
731{
732 const struct intel_viewport_state *viewport = cmd->bind.state.viewport;
733 XGL_UINT pos;
734
735 if (!viewport)
736 return;
737
738 pos = cmd_state_copy(cmd, viewport->cmd, viewport->cmd_len,
739 viewport->cmd_align);
740
741 gen7_3dstate_pointer(cmd,
742 GEN7_RENDER_OPCODE_3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP, pos);
743 gen7_3dstate_pointer(cmd,
744 GEN7_RENDER_OPCODE_3DSTATE_VIEWPORT_STATE_POINTERS_CC,
745 pos + viewport->cmd_cc_offset);
746 if (viewport->scissor_enable) {
747 gen7_3dstate_pointer(cmd,
748 GEN6_RENDER_OPCODE_3DSTATE_SCISSOR_STATE_POINTERS,
749 pos + viewport->cmd_scissor_rect_offset);
750 }
751}
752
Chia-I Wu7fd5cac2014-08-27 13:19:29 +0800753static void gen6_pcb(struct intel_cmd *cmd, int subop,
754 const XGL_PIPELINE_SHADER *sh)
755{
756 const uint8_t cmd_len = 5;
757 const XGL_UINT alignment = 32;
758 const XGL_UINT max_size =
759 (subop == GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_VS) ? 1024 : 2048;
760 const XGL_UINT max_pcb = 4;
761 uint32_t pcb[4] = { 0, 0, 0, 0 };
762 XGL_FLAGS pcb_enables = 0;
763 XGL_SIZE total_size = 0;
764 uint32_t dw0;
765 XGL_UINT i;
766
767 for (i = 0; i < sh->linkConstBufferCount; i++) {
768 const XGL_LINK_CONST_BUFFER *info = &sh->pLinkConstBufferInfo[i];
769 const XGL_SIZE size = u_align(info->bufferSize, alignment);
770 void *ptr;
771
772 if (info->bufferId >= max_pcb ||
773 pcb_enables & ((1 << info->bufferId)) ||
774 total_size + info->bufferSize > max_size) {
775 cmd->result = XGL_ERROR_UNKNOWN;
776 return;
777 }
778 if (!size)
779 continue;
780
781 pcb_enables |= 1 << info->bufferId;
782 total_size += size;
783
784 ptr = cmd_state_reserve(cmd, size / sizeof(uint32_t),
785 alignment / sizeof(uint32_t), &pcb[info->bufferId]);
786 memcpy(ptr, info->pBufferData, info->bufferSize);
787 cmd_state_advance(cmd, size / sizeof(uint32_t));
788
789 pcb[info->bufferId] |= size / alignment - 1;
790 }
791
792 dw0 = GEN6_RENDER_TYPE_RENDER |
793 GEN6_RENDER_SUBTYPE_3D |
794 subop |
795 pcb_enables << 12 |
796 (cmd_len - 2);
797
798 cmd_batch_reserve(cmd, cmd_len);
799 cmd_batch_write(cmd, dw0);
800 cmd_batch_write(cmd, pcb[0]);
801 cmd_batch_write(cmd, pcb[1]);
802 cmd_batch_write(cmd, pcb[2]);
803 cmd_batch_write(cmd, pcb[3]);
804}
805
806static void gen7_pcb(struct intel_cmd *cmd, int subop,
807 const XGL_PIPELINE_SHADER *sh)
808{
809 const uint8_t cmd_len = 7;
810 const uint32_t dw0 = GEN6_RENDER_TYPE_RENDER |
811 GEN6_RENDER_SUBTYPE_3D |
812 subop |
813 (cmd_len - 2);
814 const XGL_UINT alignment = 32;
815 const XGL_UINT max_size = 2048;
816 const XGL_UINT max_pcb = 4;
817 uint16_t pcb_len[4] = { 0, 0, 0, 0 };
818 uint32_t pcb[4] = { 0, 0, 0, 0 };
819 XGL_FLAGS pcb_enables = 0;
820 XGL_SIZE total_size = 0;
821 XGL_UINT i;
822
823 for (i = 0; i < sh->linkConstBufferCount; i++) {
824 const XGL_LINK_CONST_BUFFER *info = &sh->pLinkConstBufferInfo[i];
825 const XGL_SIZE size = u_align(info->bufferSize, alignment);
826 void *ptr;
827
828 if (info->bufferId >= max_pcb ||
829 pcb_enables & ((1 << info->bufferId)) ||
830 total_size + info->bufferSize > max_size) {
831 cmd->result = XGL_ERROR_UNKNOWN;
832 return;
833 }
834 if (!size)
835 continue;
836
837 pcb_enables |= 1 << info->bufferId;
838 total_size += size;
839
840 pcb_len[info->bufferId] = size / alignment;
841
842 ptr = cmd_state_reserve(cmd, size / sizeof(uint32_t),
843 alignment / sizeof(uint32_t), &pcb[info->bufferId]);
844 memcpy(ptr, info->pBufferData, info->bufferSize);
845 cmd_state_advance(cmd, size / sizeof(uint32_t));
846 }
847
848 /* no holes */
849 if (!u_is_pow2(pcb_enables + 1)) {
850 cmd->result = XGL_ERROR_UNKNOWN;
851 return;
852 }
853
854 cmd_batch_reserve(cmd, cmd_len);
855 cmd_batch_write(cmd, dw0);
856 cmd_batch_write(cmd, pcb_len[1] << 16 | pcb_len[0]);
857 cmd_batch_write(cmd, pcb_len[3] << 16 | pcb_len[2]);
858 cmd_batch_write(cmd, pcb[0]);
859 cmd_batch_write(cmd, pcb[1]);
860 cmd_batch_write(cmd, pcb[2]);
861 cmd_batch_write(cmd, pcb[3]);
862}
863
Chia-I Wu42a56202014-08-23 16:47:48 +0800864static void emit_ps_resources(struct intel_cmd *cmd,
865 const struct intel_rmap *rmap)
866{
867 const XGL_UINT surface_count = rmap->rt_count +
868 rmap->resource_count + rmap->uav_count;
869 uint32_t binding_table[256];
870 XGL_UINT pos, i;
871
872 assert(surface_count <= ARRAY_SIZE(binding_table));
873
874 for (i = 0; i < surface_count; i++) {
875 const struct intel_rmap_slot *slot = &rmap->slots[i];
876 uint32_t *dw;
877
878 switch (slot->path_len) {
879 case 0:
880 pos = 0;
881 break;
882 case INTEL_RMAP_SLOT_RT:
883 {
884 const struct intel_rt_view *view = cmd->bind.att.rt[i];
885
886 dw = cmd_state_reserve_reloc(cmd, view->cmd_len, 1,
887 GEN6_ALIGNMENT_SURFACE_STATE, &pos);
888
889 memcpy(dw, view->cmd, sizeof(uint32_t) * view->cmd_len);
Chia-I Wubda55fd2014-08-25 12:46:10 +0800890 cmd_state_reloc(cmd, 1, view->cmd[1], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800891 INTEL_RELOC_WRITE);
Chia-I Wu42a56202014-08-23 16:47:48 +0800892 cmd_state_advance(cmd, view->cmd_len);
893 }
894 break;
895 case INTEL_RMAP_SLOT_DYN:
896 {
897 const struct intel_mem_view *view =
Chia-I Wu9f1722c2014-08-25 10:17:58 +0800898 &cmd->bind.dyn_view.graphics;
Chia-I Wu42a56202014-08-23 16:47:48 +0800899
900 dw = cmd_state_reserve_reloc(cmd, view->cmd_len, 1,
901 GEN6_ALIGNMENT_SURFACE_STATE, &pos);
902
903 memcpy(dw, view->cmd, sizeof(uint32_t) * view->cmd_len);
Chia-I Wubda55fd2014-08-25 12:46:10 +0800904 cmd_state_reloc(cmd, 1, view->cmd[1], view->mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800905 INTEL_RELOC_WRITE);
Chia-I Wu42a56202014-08-23 16:47:48 +0800906 cmd_state_advance(cmd, view->cmd_len);
907 }
908 break;
909 case 1:
910 default:
911 /* TODO */
912 assert(!"no dset support");
913 break;
914 }
915
916 binding_table[i] = pos << 2;
917 }
918
919 pos = cmd_state_copy(cmd, binding_table, surface_count,
920 GEN6_ALIGNMENT_BINDING_TABLE_STATE);
921
922 if (cmd_gen(cmd) >= INTEL_GEN(7)) {
923 gen7_3dstate_pointer(cmd,
924 GEN7_RENDER_OPCODE_3DSTATE_BINDING_TABLE_POINTERS_PS, pos);
925 } else {
926 gen6_3DSTATE_BINDING_TABLE_POINTERS(cmd, 0, 0, pos);
927 }
928}
929
Chia-I Wu52500102014-08-22 00:46:04 +0800930static void emit_bounded_states(struct intel_cmd *cmd)
931{
932 const struct intel_msaa_state *msaa = cmd->bind.state.msaa;
933
934 /* TODO more states */
935
Chia-I Wu1744cca2014-08-22 11:10:17 +0800936 if (cmd_gen(cmd) >= INTEL_GEN(7)) {
Chia-I Wu302742d2014-08-22 10:28:29 +0800937 gen7_cc_states(cmd);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800938 gen7_viewport_states(cmd);
Chia-I Wu7fd5cac2014-08-27 13:19:29 +0800939
940 gen7_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_VS,
941 &cmd->bind.pipeline.graphics->vs);
942 gen7_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_PS,
943 &cmd->bind.pipeline.graphics->fs);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800944 } else {
Chia-I Wu302742d2014-08-22 10:28:29 +0800945 gen6_cc_states(cmd);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800946 gen6_viewport_states(cmd);
Chia-I Wu7fd5cac2014-08-27 13:19:29 +0800947
948 gen6_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_VS,
949 &cmd->bind.pipeline.graphics->vs);
950 gen6_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_PS,
951 &cmd->bind.pipeline.graphics->fs);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800952 }
Chia-I Wu302742d2014-08-22 10:28:29 +0800953
Chia-I Wu42a56202014-08-23 16:47:48 +0800954 emit_ps_resources(cmd, cmd->bind.pipeline.graphics->fs_rmap);
955
Chia-I Wu52500102014-08-22 00:46:04 +0800956 /* 3DSTATE_MULTISAMPLE and 3DSTATE_SAMPLE_MASK */
Chia-I Wu48c283d2014-08-25 23:13:46 +0800957 gen6_wa_post_sync_flush(cmd);
Chia-I Wu52500102014-08-22 00:46:04 +0800958 cmd_batch_reserve(cmd, msaa->cmd_len);
959 cmd_batch_write_n(cmd, msaa->cmd, msaa->cmd_len);
960}
961
Chia-I Wu9f1722c2014-08-25 10:17:58 +0800962static void cmd_bind_graphics_pipeline(struct intel_cmd *cmd,
963 const struct intel_pipeline *pipeline)
964{
965 cmd->bind.pipeline.graphics = pipeline;
966}
967
968static void cmd_bind_compute_pipeline(struct intel_cmd *cmd,
969 const struct intel_pipeline *pipeline)
970{
971 cmd->bind.pipeline.compute = pipeline;
972}
973
974static void cmd_bind_graphics_delta(struct intel_cmd *cmd,
975 const struct intel_pipeline_delta *delta)
976{
977 cmd->bind.pipeline.graphics_delta = delta;
978}
979
980static void cmd_bind_compute_delta(struct intel_cmd *cmd,
981 const struct intel_pipeline_delta *delta)
982{
983 cmd->bind.pipeline.compute_delta = delta;
984}
985
986static void cmd_bind_graphics_dset(struct intel_cmd *cmd,
987 const struct intel_dset *dset,
988 XGL_UINT slot_offset)
989{
990 cmd->bind.dset.graphics = dset;
991 cmd->bind.dset.graphics_offset = slot_offset;
992}
993
994static void cmd_bind_compute_dset(struct intel_cmd *cmd,
995 const struct intel_dset *dset,
996 XGL_UINT slot_offset)
997{
998 cmd->bind.dset.compute = dset;
999 cmd->bind.dset.compute_offset = slot_offset;
1000}
1001
1002static void cmd_bind_graphics_dyn_view(struct intel_cmd *cmd,
1003 const XGL_MEMORY_VIEW_ATTACH_INFO *info)
1004{
1005 intel_mem_view_init(&cmd->bind.dyn_view.graphics, cmd->dev, info);
1006}
1007
1008static void cmd_bind_compute_dyn_view(struct intel_cmd *cmd,
1009 const XGL_MEMORY_VIEW_ATTACH_INFO *info)
1010{
1011 intel_mem_view_init(&cmd->bind.dyn_view.compute, cmd->dev, info);
1012}
1013
1014static void cmd_bind_index_data(struct intel_cmd *cmd,
1015 const struct intel_mem *mem,
1016 XGL_GPU_SIZE offset, XGL_INDEX_TYPE type)
1017{
1018 if (cmd_gen(cmd) >= INTEL_GEN(7.5)) {
1019 gen6_3DSTATE_INDEX_BUFFER(cmd, mem, offset, type, false);
1020 } else {
1021 cmd->bind.index.mem = mem;
1022 cmd->bind.index.offset = offset;
1023 cmd->bind.index.type = type;
1024 }
1025}
1026
1027static void cmd_bind_rt(struct intel_cmd *cmd,
1028 const XGL_COLOR_ATTACHMENT_BIND_INFO *attachments,
1029 XGL_UINT count)
1030{
Chia-I Wud88e02d2014-08-25 10:56:13 +08001031 XGL_UINT width = 0, height = 0;
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001032 XGL_UINT i;
1033
1034 for (i = 0; i < count; i++) {
1035 const XGL_COLOR_ATTACHMENT_BIND_INFO *att = &attachments[i];
1036 const struct intel_rt_view *rt = intel_rt_view(att->view);
Chia-I Wud88e02d2014-08-25 10:56:13 +08001037 const struct intel_layout *layout = &rt->img->layout;
1038
1039 if (i == 0) {
1040 width = layout->width0;
1041 height = layout->height0;
1042 } else {
1043 if (width > layout->width0)
1044 width = layout->width0;
1045 if (height > layout->height0)
1046 height = layout->height0;
1047 }
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001048
1049 cmd->bind.att.rt[i] = rt;
1050 }
1051
1052 cmd->bind.att.rt_count = count;
Chia-I Wud88e02d2014-08-25 10:56:13 +08001053
Chia-I Wu48c283d2014-08-25 23:13:46 +08001054 gen6_wa_post_sync_flush(cmd);
Chia-I Wud88e02d2014-08-25 10:56:13 +08001055 gen6_3DSTATE_DRAWING_RECTANGLE(cmd, width, height);
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001056}
1057
1058static void cmd_bind_ds(struct intel_cmd *cmd,
1059 const XGL_DEPTH_STENCIL_BIND_INFO *info)
1060{
1061 const struct intel_ds_view *ds;
1062
1063 if (info) {
1064 cmd->bind.att.ds = intel_ds_view(info->view);
1065 ds = cmd->bind.att.ds;
1066 } else {
1067 /* all zeros */
1068 static const struct intel_ds_view null_ds;
1069 ds = &null_ds;
1070 }
1071
Chia-I Wu48c283d2014-08-25 23:13:46 +08001072 gen6_wa_ds_flush(cmd);
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001073 gen6_3DSTATE_DEPTH_BUFFER(cmd, ds);
1074 gen6_3DSTATE_STENCIL_BUFFER(cmd, ds);
1075 gen6_3DSTATE_HIER_DEPTH_BUFFER(cmd, ds);
Chia-I Wuf8231032014-08-25 10:44:45 +08001076
1077 if (cmd_gen(cmd) >= INTEL_GEN(7))
1078 gen7_3DSTATE_CLEAR_PARAMS(cmd, 0);
1079 else
1080 gen6_3DSTATE_CLEAR_PARAMS(cmd, 0);
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001081}
1082
1083static void cmd_bind_viewport_state(struct intel_cmd *cmd,
1084 const struct intel_viewport_state *state)
1085{
1086 cmd->bind.state.viewport = state;
1087}
1088
1089static void cmd_bind_raster_state(struct intel_cmd *cmd,
1090 const struct intel_raster_state *state)
1091{
1092 cmd->bind.state.raster = state;
1093}
1094
1095static void cmd_bind_ds_state(struct intel_cmd *cmd,
1096 const struct intel_ds_state *state)
1097{
1098 cmd->bind.state.ds = state;
1099}
1100
1101static void cmd_bind_blend_state(struct intel_cmd *cmd,
1102 const struct intel_blend_state *state)
1103{
1104 cmd->bind.state.blend = state;
1105}
1106
1107static void cmd_bind_msaa_state(struct intel_cmd *cmd,
1108 const struct intel_msaa_state *state)
1109{
1110 cmd->bind.state.msaa = state;
1111}
1112
1113static void cmd_draw(struct intel_cmd *cmd,
1114 XGL_UINT vertex_start,
1115 XGL_UINT vertex_count,
1116 XGL_UINT instance_start,
1117 XGL_UINT instance_count,
1118 bool indexed,
1119 XGL_UINT vertex_base)
1120{
1121 const struct intel_pipeline *p = cmd->bind.pipeline.graphics;
1122
1123 emit_bounded_states(cmd);
1124
1125 if (indexed) {
1126 if (p->primitive_restart && !gen6_can_primitive_restart(cmd))
1127 cmd->result = XGL_ERROR_UNKNOWN;
1128
1129 if (cmd_gen(cmd) >= INTEL_GEN(7.5)) {
1130 gen75_3DSTATE_VF(cmd, p->primitive_restart,
1131 p->primitive_restart_index);
1132 } else {
1133 gen6_3DSTATE_INDEX_BUFFER(cmd, cmd->bind.index.mem,
1134 cmd->bind.index.offset, cmd->bind.index.type,
1135 p->primitive_restart);
1136 }
1137 } else {
1138 assert(!vertex_base);
1139 }
1140
1141 if (cmd_gen(cmd) >= INTEL_GEN(7)) {
1142 gen7_3DPRIMITIVE(cmd, p->prim_type, indexed, vertex_count,
1143 vertex_start, instance_count, instance_start, vertex_base);
1144 } else {
1145 gen6_3DPRIMITIVE(cmd, p->prim_type, indexed, vertex_count,
1146 vertex_start, instance_count, instance_start, vertex_base);
1147 }
Chia-I Wu48c283d2014-08-25 23:13:46 +08001148
Chia-I Wu707a29e2014-08-27 12:51:47 +08001149 cmd->bind.draw_count++;
Chia-I Wu48c283d2014-08-25 23:13:46 +08001150 /* need to re-emit all workarounds */
1151 cmd->bind.wa_flags = 0;
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001152}
1153
Chia-I Wub2755562014-08-20 13:38:52 +08001154XGL_VOID XGLAPI intelCmdBindPipeline(
1155 XGL_CMD_BUFFER cmdBuffer,
1156 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1157 XGL_PIPELINE pipeline)
1158{
1159 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1160
1161 switch (pipelineBindPoint) {
1162 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001163 cmd_bind_compute_pipeline(cmd, intel_pipeline(pipeline));
Chia-I Wub2755562014-08-20 13:38:52 +08001164 break;
1165 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001166 cmd_bind_graphics_pipeline(cmd, intel_pipeline(pipeline));
Chia-I Wub2755562014-08-20 13:38:52 +08001167 break;
1168 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001169 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001170 break;
1171 }
1172}
1173
1174XGL_VOID XGLAPI intelCmdBindPipelineDelta(
1175 XGL_CMD_BUFFER cmdBuffer,
1176 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1177 XGL_PIPELINE_DELTA delta)
1178{
1179 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1180
1181 switch (pipelineBindPoint) {
1182 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001183 cmd_bind_compute_delta(cmd, delta);
Chia-I Wub2755562014-08-20 13:38:52 +08001184 break;
1185 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001186 cmd_bind_graphics_delta(cmd, delta);
Chia-I Wub2755562014-08-20 13:38:52 +08001187 break;
1188 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001189 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001190 break;
1191 }
1192}
1193
1194XGL_VOID XGLAPI intelCmdBindStateObject(
1195 XGL_CMD_BUFFER cmdBuffer,
1196 XGL_STATE_BIND_POINT stateBindPoint,
1197 XGL_STATE_OBJECT state)
1198{
1199 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1200
1201 switch (stateBindPoint) {
1202 case XGL_STATE_BIND_VIEWPORT:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001203 cmd_bind_viewport_state(cmd,
1204 intel_viewport_state((XGL_VIEWPORT_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001205 break;
1206 case XGL_STATE_BIND_RASTER:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001207 cmd_bind_raster_state(cmd,
1208 intel_raster_state((XGL_RASTER_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001209 break;
1210 case XGL_STATE_BIND_DEPTH_STENCIL:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001211 cmd_bind_ds_state(cmd,
1212 intel_ds_state((XGL_DEPTH_STENCIL_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001213 break;
1214 case XGL_STATE_BIND_COLOR_BLEND:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001215 cmd_bind_blend_state(cmd,
1216 intel_blend_state((XGL_COLOR_BLEND_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001217 break;
1218 case XGL_STATE_BIND_MSAA:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001219 cmd_bind_msaa_state(cmd,
1220 intel_msaa_state((XGL_MSAA_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001221 break;
1222 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001223 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001224 break;
1225 }
1226}
1227
1228XGL_VOID XGLAPI intelCmdBindDescriptorSet(
1229 XGL_CMD_BUFFER cmdBuffer,
1230 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1231 XGL_UINT index,
1232 XGL_DESCRIPTOR_SET descriptorSet,
1233 XGL_UINT slotOffset)
1234{
1235 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1236 struct intel_dset *dset = intel_dset(descriptorSet);
1237
1238 assert(!index);
1239
1240 switch (pipelineBindPoint) {
1241 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001242 cmd_bind_compute_dset(cmd, dset, slotOffset);
Chia-I Wub2755562014-08-20 13:38:52 +08001243 break;
1244 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001245 cmd_bind_graphics_dset(cmd, dset, slotOffset);
Chia-I Wub2755562014-08-20 13:38:52 +08001246 break;
1247 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001248 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001249 break;
1250 }
1251}
1252
1253XGL_VOID XGLAPI intelCmdBindDynamicMemoryView(
1254 XGL_CMD_BUFFER cmdBuffer,
1255 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1256 const XGL_MEMORY_VIEW_ATTACH_INFO* pMemView)
1257{
1258 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1259
1260 switch (pipelineBindPoint) {
1261 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001262 cmd_bind_compute_dyn_view(cmd, pMemView);
Chia-I Wub2755562014-08-20 13:38:52 +08001263 break;
1264 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001265 cmd_bind_graphics_dyn_view(cmd, pMemView);
Chia-I Wub2755562014-08-20 13:38:52 +08001266 break;
1267 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001268 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001269 break;
1270 }
1271}
1272
1273XGL_VOID XGLAPI intelCmdBindIndexData(
1274 XGL_CMD_BUFFER cmdBuffer,
1275 XGL_GPU_MEMORY mem_,
1276 XGL_GPU_SIZE offset,
1277 XGL_INDEX_TYPE indexType)
1278{
1279 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1280 struct intel_mem *mem = intel_mem(mem_);
1281
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001282 cmd_bind_index_data(cmd, mem, offset, indexType);
Chia-I Wub2755562014-08-20 13:38:52 +08001283}
1284
1285XGL_VOID XGLAPI intelCmdBindAttachments(
1286 XGL_CMD_BUFFER cmdBuffer,
1287 XGL_UINT colorAttachmentCount,
1288 const XGL_COLOR_ATTACHMENT_BIND_INFO* pColorAttachments,
1289 const XGL_DEPTH_STENCIL_BIND_INFO* pDepthStencilAttachment)
1290{
1291 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
Chia-I Wub2755562014-08-20 13:38:52 +08001292
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001293 cmd_bind_rt(cmd, pColorAttachments, colorAttachmentCount);
1294 cmd_bind_ds(cmd, pDepthStencilAttachment);
Chia-I Wub2755562014-08-20 13:38:52 +08001295}
1296
1297XGL_VOID XGLAPI intelCmdDraw(
1298 XGL_CMD_BUFFER cmdBuffer,
1299 XGL_UINT firstVertex,
1300 XGL_UINT vertexCount,
1301 XGL_UINT firstInstance,
1302 XGL_UINT instanceCount)
1303{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001304 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
Chia-I Wu59c097e2014-08-21 10:51:07 +08001305
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001306 cmd_draw(cmd, firstVertex, vertexCount,
1307 firstInstance, instanceCount, false, 0);
Chia-I Wub2755562014-08-20 13:38:52 +08001308}
1309
1310XGL_VOID XGLAPI intelCmdDrawIndexed(
1311 XGL_CMD_BUFFER cmdBuffer,
1312 XGL_UINT firstIndex,
1313 XGL_UINT indexCount,
1314 XGL_INT vertexOffset,
1315 XGL_UINT firstInstance,
1316 XGL_UINT instanceCount)
1317{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001318 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
Chia-I Wu59c097e2014-08-21 10:51:07 +08001319
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001320 cmd_draw(cmd, firstIndex, indexCount,
1321 firstInstance, instanceCount, true, vertexOffset);
Chia-I Wub2755562014-08-20 13:38:52 +08001322}
1323
1324XGL_VOID XGLAPI intelCmdDrawIndirect(
1325 XGL_CMD_BUFFER cmdBuffer,
1326 XGL_GPU_MEMORY mem,
1327 XGL_GPU_SIZE offset,
1328 XGL_UINT32 count,
1329 XGL_UINT32 stride)
1330{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001331 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1332
1333 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001334}
1335
1336XGL_VOID XGLAPI intelCmdDrawIndexedIndirect(
1337 XGL_CMD_BUFFER cmdBuffer,
1338 XGL_GPU_MEMORY mem,
1339 XGL_GPU_SIZE offset,
1340 XGL_UINT32 count,
1341 XGL_UINT32 stride)
1342{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001343 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1344
1345 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001346}
1347
1348XGL_VOID XGLAPI intelCmdDispatch(
1349 XGL_CMD_BUFFER cmdBuffer,
1350 XGL_UINT x,
1351 XGL_UINT y,
1352 XGL_UINT z)
1353{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001354 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1355
1356 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001357}
1358
1359XGL_VOID XGLAPI intelCmdDispatchIndirect(
1360 XGL_CMD_BUFFER cmdBuffer,
1361 XGL_GPU_MEMORY mem,
1362 XGL_GPU_SIZE offset)
1363{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001364 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1365
1366 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001367}