blob: 253fe1ef39c65f03a1bf88cc534274fd26485664 [file] [log] [blame]
/*
 * XGL
 *
 * Copyright (C) 2014 LunarG, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included
 * in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */
24
Chia-I Wu9f039862014-08-20 15:39:56 +080025#include "genhw/genhw.h"
Chia-I Wub2755562014-08-20 13:38:52 +080026#include "dset.h"
Chia-I Wu7fae4e32014-08-21 11:39:44 +080027#include "img.h"
Chia-I Wub2755562014-08-20 13:38:52 +080028#include "mem.h"
Chia-I Wu018a3962014-08-21 10:37:52 +080029#include "pipeline.h"
Chia-I Wub2755562014-08-20 13:38:52 +080030#include "state.h"
31#include "view.h"
32#include "cmd_priv.h"
33
/*
 * Workaround bookkeeping bits stored in cmd->bind.wa_flags.  A bit is set
 * once the corresponding workaround sequence has been emitted so that it is
 * not emitted again.
 */
enum {
    /* set by gen6_wa_post_sync_flush() */
    GEN6_WA_POST_SYNC_FLUSH = (1 << 0),
    /* set by gen6_wa_ds_flush() */
    GEN6_WA_DS_FLUSH = (1 << 1),
};
38
Chia-I Wu59c097e2014-08-21 10:51:07 +080039static void gen6_3DPRIMITIVE(struct intel_cmd *cmd,
Chia-I Wu254db422014-08-21 11:54:29 +080040 int prim_type, bool indexed,
Chia-I Wu59c097e2014-08-21 10:51:07 +080041 uint32_t vertex_count,
42 uint32_t vertex_start,
43 uint32_t instance_count,
44 uint32_t instance_start,
45 uint32_t vertex_base)
46{
47 const uint8_t cmd_len = 6;
48 uint32_t dw0;
49
50 CMD_ASSERT(cmd, 6, 6);
51
Chia-I Wu426072d2014-08-26 14:31:55 +080052 dw0 = GEN6_RENDER_CMD(3D, 3DPRIMITIVE) |
Chia-I Wu254db422014-08-21 11:54:29 +080053 prim_type << GEN6_3DPRIM_DW0_TYPE__SHIFT |
Chia-I Wu59c097e2014-08-21 10:51:07 +080054 (cmd_len - 2);
55
56 if (indexed)
57 dw0 |= GEN6_3DPRIM_DW0_ACCESS_RANDOM;
58
Chia-I Wue24c3292014-08-21 14:05:23 +080059 cmd_batch_reserve(cmd, cmd_len);
60 cmd_batch_write(cmd, dw0);
61 cmd_batch_write(cmd, vertex_count);
62 cmd_batch_write(cmd, vertex_start);
63 cmd_batch_write(cmd, instance_count);
64 cmd_batch_write(cmd, instance_start);
65 cmd_batch_write(cmd, vertex_base);
Chia-I Wu59c097e2014-08-21 10:51:07 +080066}
67
68static void gen7_3DPRIMITIVE(struct intel_cmd *cmd,
Chia-I Wu254db422014-08-21 11:54:29 +080069 int prim_type, bool indexed,
Chia-I Wu59c097e2014-08-21 10:51:07 +080070 uint32_t vertex_count,
71 uint32_t vertex_start,
72 uint32_t instance_count,
73 uint32_t instance_start,
74 uint32_t vertex_base)
75{
76 const uint8_t cmd_len = 7;
77 uint32_t dw0, dw1;
78
79 CMD_ASSERT(cmd, 7, 7.5);
80
Chia-I Wu426072d2014-08-26 14:31:55 +080081 dw0 = GEN6_RENDER_CMD(3D, 3DPRIMITIVE) | (cmd_len - 2);
Chia-I Wu254db422014-08-21 11:54:29 +080082 dw1 = prim_type << GEN7_3DPRIM_DW1_TYPE__SHIFT;
Chia-I Wu59c097e2014-08-21 10:51:07 +080083
84 if (indexed)
85 dw1 |= GEN7_3DPRIM_DW1_ACCESS_RANDOM;
86
Chia-I Wue24c3292014-08-21 14:05:23 +080087 cmd_batch_reserve(cmd, cmd_len);
88 cmd_batch_write(cmd, dw0);
89 cmd_batch_write(cmd, dw1);
90 cmd_batch_write(cmd, vertex_count);
91 cmd_batch_write(cmd, vertex_start);
92 cmd_batch_write(cmd, instance_count);
93 cmd_batch_write(cmd, instance_start);
94 cmd_batch_write(cmd, vertex_base);
Chia-I Wu59c097e2014-08-21 10:51:07 +080095}
96
Chia-I Wu270b1e82014-08-25 15:53:39 +080097static void gen6_PIPE_CONTROL(struct intel_cmd *cmd, uint32_t dw1,
98 struct intel_bo *bo, uint32_t bo_offset)
99{
100 const uint8_t cmd_len = 5;
Chia-I Wu426072d2014-08-26 14:31:55 +0800101 const uint32_t dw0 = GEN6_RENDER_CMD(3D, PIPE_CONTROL) |
Chia-I Wu270b1e82014-08-25 15:53:39 +0800102 (cmd_len - 2);
Chia-I Wu270b1e82014-08-25 15:53:39 +0800103
104 CMD_ASSERT(cmd, 6, 7.5);
105
106 assert(bo_offset % 8 == 0);
107
108 if (dw1 & GEN6_PIPE_CONTROL_CS_STALL) {
109 /*
110 * From the Sandy Bridge PRM, volume 2 part 1, page 73:
111 *
112 * "1 of the following must also be set (when CS stall is set):
113 *
114 * * Depth Cache Flush Enable ([0] of DW1)
115 * * Stall at Pixel Scoreboard ([1] of DW1)
116 * * Depth Stall ([13] of DW1)
117 * * Post-Sync Operation ([13] of DW1)
118 * * Render Target Cache Flush Enable ([12] of DW1)
119 * * Notify Enable ([8] of DW1)"
120 *
121 * From the Ivy Bridge PRM, volume 2 part 1, page 61:
122 *
123 * "One of the following must also be set (when CS stall is set):
124 *
125 * * Render Target Cache Flush Enable ([12] of DW1)
126 * * Depth Cache Flush Enable ([0] of DW1)
127 * * Stall at Pixel Scoreboard ([1] of DW1)
128 * * Depth Stall ([13] of DW1)
129 * * Post-Sync Operation ([13] of DW1)"
130 */
131 uint32_t bit_test = GEN6_PIPE_CONTROL_RENDER_CACHE_FLUSH |
132 GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH |
133 GEN6_PIPE_CONTROL_PIXEL_SCOREBOARD_STALL |
134 GEN6_PIPE_CONTROL_DEPTH_STALL;
135
136 /* post-sync op */
137 bit_test |= GEN6_PIPE_CONTROL_WRITE_IMM |
138 GEN6_PIPE_CONTROL_WRITE_PS_DEPTH_COUNT |
139 GEN6_PIPE_CONTROL_WRITE_TIMESTAMP;
140
141 if (cmd_gen(cmd) == INTEL_GEN(6))
142 bit_test |= GEN6_PIPE_CONTROL_NOTIFY_ENABLE;
143
144 assert(dw1 & bit_test);
145 }
146
147 if (dw1 & GEN6_PIPE_CONTROL_DEPTH_STALL) {
148 /*
149 * From the Sandy Bridge PRM, volume 2 part 1, page 73:
150 *
151 * "Following bits must be clear (when Depth Stall is set):
152 *
153 * * Render Target Cache Flush Enable ([12] of DW1)
154 * * Depth Cache Flush Enable ([0] of DW1)"
155 */
156 assert(!(dw1 & (GEN6_PIPE_CONTROL_RENDER_CACHE_FLUSH |
157 GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH)));
158 }
159
160 /*
161 * From the Sandy Bridge PRM, volume 1 part 3, page 19:
162 *
163 * "[DevSNB] PPGTT memory writes by MI_* (such as MI_STORE_DATA_IMM)
164 * and PIPE_CONTROL are not supported."
165 *
166 * The kernel will add the mapping automatically (when write domain is
167 * INTEL_DOMAIN_INSTRUCTION).
168 */
169 if (cmd_gen(cmd) == INTEL_GEN(6) && bo)
170 bo_offset |= GEN6_PIPE_CONTROL_DW2_USE_GGTT;
171
172 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) bo);
173 cmd_batch_write(cmd, dw0);
174 cmd_batch_write(cmd, dw1);
Chia-I Wu32a22462014-08-26 14:13:46 +0800175 if (bo) {
176 cmd_batch_reloc(cmd, bo_offset, bo, INTEL_RELOC_GGTT |
177 INTEL_RELOC_WRITE);
178 } else {
Chia-I Wu270b1e82014-08-25 15:53:39 +0800179 cmd_batch_write(cmd, 0);
Chia-I Wu32a22462014-08-26 14:13:46 +0800180 }
Chia-I Wu270b1e82014-08-25 15:53:39 +0800181 cmd_batch_write(cmd, 0);
182 cmd_batch_write(cmd, 0);
183}
184
Chia-I Wu254db422014-08-21 11:54:29 +0800185static bool gen6_can_primitive_restart(const struct intel_cmd *cmd)
186{
187 const struct intel_pipeline *p = cmd->bind.pipeline.graphics;
188 bool supported;
189
190 CMD_ASSERT(cmd, 6, 7.5);
191
192 if (cmd_gen(cmd) >= INTEL_GEN(7.5))
193 return (p->prim_type != GEN6_3DPRIM_RECTLIST);
194
195 switch (p->prim_type) {
196 case GEN6_3DPRIM_POINTLIST:
197 case GEN6_3DPRIM_LINELIST:
198 case GEN6_3DPRIM_LINESTRIP:
199 case GEN6_3DPRIM_TRILIST:
200 case GEN6_3DPRIM_TRISTRIP:
201 supported = true;
202 break;
203 default:
204 supported = false;
205 break;
206 }
207
208 if (!supported)
209 return false;
210
211 switch (cmd->bind.index.type) {
212 case XGL_INDEX_8:
213 supported = (p->primitive_restart_index != 0xffu);
214 break;
215 case XGL_INDEX_16:
216 supported = (p->primitive_restart_index != 0xffffu);
217 break;
218 case XGL_INDEX_32:
219 supported = (p->primitive_restart_index != 0xffffffffu);
220 break;
221 default:
222 supported = false;
223 break;
224 }
225
226 return supported;
227}
228
Chia-I Wu59c097e2014-08-21 10:51:07 +0800229static void gen6_3DSTATE_INDEX_BUFFER(struct intel_cmd *cmd,
Chia-I Wu958d1b72014-08-21 11:28:11 +0800230 const struct intel_mem *mem,
Chia-I Wu59c097e2014-08-21 10:51:07 +0800231 XGL_GPU_SIZE offset,
232 XGL_INDEX_TYPE type,
233 bool enable_cut_index)
234{
235 const uint8_t cmd_len = 3;
236 uint32_t dw0, end_offset;
237 unsigned offset_align;
238
239 CMD_ASSERT(cmd, 6, 7.5);
240
Chia-I Wu426072d2014-08-26 14:31:55 +0800241 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_INDEX_BUFFER) | (cmd_len - 2);
Chia-I Wu59c097e2014-08-21 10:51:07 +0800242
243 /* the bit is moved to 3DSTATE_VF */
244 if (cmd_gen(cmd) >= INTEL_GEN(7.5))
245 assert(!enable_cut_index);
246 if (enable_cut_index)
247 dw0 |= GEN6_IB_DW0_CUT_INDEX_ENABLE;
248
249 switch (type) {
250 case XGL_INDEX_8:
251 dw0 |= GEN6_IB_DW0_FORMAT_BYTE;
252 offset_align = 1;
253 break;
254 case XGL_INDEX_16:
255 dw0 |= GEN6_IB_DW0_FORMAT_WORD;
256 offset_align = 2;
257 break;
258 case XGL_INDEX_32:
259 dw0 |= GEN6_IB_DW0_FORMAT_DWORD;
260 offset_align = 4;
261 break;
262 default:
263 cmd->result = XGL_ERROR_INVALID_VALUE;
264 return;
265 break;
266 }
267
268 if (offset % offset_align) {
269 cmd->result = XGL_ERROR_INVALID_VALUE;
270 return;
271 }
272
273 /* aligned and inclusive */
274 end_offset = mem->size - (mem->size % offset_align) - 1;
275
Chia-I Wu2de65d02014-08-25 10:02:53 +0800276 cmd_batch_reserve_reloc(cmd, cmd_len, 2);
Chia-I Wue24c3292014-08-21 14:05:23 +0800277 cmd_batch_write(cmd, dw0);
Chia-I Wu32a22462014-08-26 14:13:46 +0800278 cmd_batch_reloc(cmd, offset, mem->bo, 0);
279 cmd_batch_reloc(cmd, end_offset, mem->bo, 0);
Chia-I Wu59c097e2014-08-21 10:51:07 +0800280}
281
Chia-I Wu254db422014-08-21 11:54:29 +0800282static inline void
283gen75_3DSTATE_VF(struct intel_cmd *cmd,
284 bool enable_cut_index,
285 uint32_t cut_index)
286{
287 const uint8_t cmd_len = 2;
288 uint32_t dw0;
289
290 CMD_ASSERT(cmd, 7.5, 7.5);
291
Chia-I Wu426072d2014-08-26 14:31:55 +0800292 dw0 = GEN75_RENDER_CMD(3D, 3DSTATE_VF) | (cmd_len - 2);
Chia-I Wu254db422014-08-21 11:54:29 +0800293 if (enable_cut_index)
294 dw0 |= GEN75_VF_DW0_CUT_INDEX_ENABLE;
295
Chia-I Wue24c3292014-08-21 14:05:23 +0800296 cmd_batch_reserve(cmd, cmd_len);
297 cmd_batch_write(cmd, dw0);
298 cmd_batch_write(cmd, cut_index);
Chia-I Wu254db422014-08-21 11:54:29 +0800299}
300
Chia-I Wud88e02d2014-08-25 10:56:13 +0800301static void gen6_3DSTATE_DRAWING_RECTANGLE(struct intel_cmd *cmd,
302 XGL_UINT width, XGL_UINT height)
303{
304 const uint8_t cmd_len = 4;
Chia-I Wu426072d2014-08-26 14:31:55 +0800305 const uint32_t dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_DRAWING_RECTANGLE) |
Chia-I Wud88e02d2014-08-25 10:56:13 +0800306 (cmd_len - 2);
307
308 CMD_ASSERT(cmd, 6, 7.5);
309
310 cmd_batch_reserve(cmd, cmd_len);
311 cmd_batch_write(cmd, dw0);
312 if (width && height) {
313 cmd_batch_write(cmd, 0);
314 cmd_batch_write(cmd, (height - 1) << 16 |
315 (width - 1));
316 } else {
317 cmd_batch_write(cmd, 1);
318 cmd_batch_write(cmd, 0);
319 }
320 cmd_batch_write(cmd, 0);
321}
322
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800323static void gen6_3DSTATE_DEPTH_BUFFER(struct intel_cmd *cmd,
324 const struct intel_ds_view *view)
325{
326 const uint8_t cmd_len = 7;
327 uint32_t dw0;
328
329 CMD_ASSERT(cmd, 6, 7.5);
330
331 dw0 = (cmd_gen(cmd) >= INTEL_GEN(7)) ?
Chia-I Wu426072d2014-08-26 14:31:55 +0800332 GEN7_RENDER_CMD(3D, 3DSTATE_DEPTH_BUFFER) :
333 GEN6_RENDER_CMD(3D, 3DSTATE_DEPTH_BUFFER);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800334 dw0 |= (cmd_len - 2);
335
Chia-I Wu2de65d02014-08-25 10:02:53 +0800336 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) view->img);
Chia-I Wue24c3292014-08-21 14:05:23 +0800337 cmd_batch_write(cmd, dw0);
338 cmd_batch_write(cmd, view->cmd[0]);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600339 if (view->img) {
Chia-I Wu9ee38722014-08-25 12:11:36 +0800340 cmd_batch_reloc(cmd, view->cmd[1], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800341 INTEL_RELOC_WRITE);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600342 } else {
343 cmd_batch_write(cmd, 0);
344 }
Chia-I Wue24c3292014-08-21 14:05:23 +0800345 cmd_batch_write(cmd, view->cmd[2]);
346 cmd_batch_write(cmd, view->cmd[3]);
347 cmd_batch_write(cmd, view->cmd[4]);
348 cmd_batch_write(cmd, view->cmd[5]);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800349}
350
351static void gen6_3DSTATE_STENCIL_BUFFER(struct intel_cmd *cmd,
352 const struct intel_ds_view *view)
353{
354 const uint8_t cmd_len = 3;
355 uint32_t dw0;
356
357 CMD_ASSERT(cmd, 6, 7.5);
358
359 dw0 = (cmd_gen(cmd) >= INTEL_GEN(7)) ?
Chia-I Wu426072d2014-08-26 14:31:55 +0800360 GEN7_RENDER_CMD(3D, 3DSTATE_STENCIL_BUFFER) :
361 GEN6_RENDER_CMD(3D, 3DSTATE_STENCIL_BUFFER);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800362 dw0 |= (cmd_len - 2);
363
Chia-I Wu2de65d02014-08-25 10:02:53 +0800364 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) view->img);
Chia-I Wue24c3292014-08-21 14:05:23 +0800365 cmd_batch_write(cmd, dw0);
366 cmd_batch_write(cmd, view->cmd[6]);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600367 if (view->img) {
Chia-I Wu9ee38722014-08-25 12:11:36 +0800368 cmd_batch_reloc(cmd, view->cmd[7], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800369 INTEL_RELOC_WRITE);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600370 } else {
371 cmd_batch_write(cmd, 0);
372 }
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800373}
374
375static void gen6_3DSTATE_HIER_DEPTH_BUFFER(struct intel_cmd *cmd,
376 const struct intel_ds_view *view)
377{
378 const uint8_t cmd_len = 3;
379 uint32_t dw0;
380
381 CMD_ASSERT(cmd, 6, 7.5);
382
383 dw0 = (cmd_gen(cmd) >= INTEL_GEN(7)) ?
Chia-I Wu426072d2014-08-26 14:31:55 +0800384 GEN7_RENDER_CMD(3D, 3DSTATE_HIER_DEPTH_BUFFER) :
385 GEN6_RENDER_CMD(3D, 3DSTATE_HIER_DEPTH_BUFFER);
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800386 dw0 |= (cmd_len - 2);
387
Chia-I Wu2de65d02014-08-25 10:02:53 +0800388 cmd_batch_reserve_reloc(cmd, cmd_len, (bool) view->img);
Chia-I Wue24c3292014-08-21 14:05:23 +0800389 cmd_batch_write(cmd, dw0);
390 cmd_batch_write(cmd, view->cmd[8]);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600391 if (view->img) {
Chia-I Wu9ee38722014-08-25 12:11:36 +0800392 cmd_batch_reloc(cmd, view->cmd[9], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800393 INTEL_RELOC_WRITE);
Courtney Goeltzenleuchtere316d972014-08-22 16:25:24 -0600394 } else {
395 cmd_batch_write(cmd, 0);
396 }
Chia-I Wu7fae4e32014-08-21 11:39:44 +0800397}
398
Chia-I Wuf8231032014-08-25 10:44:45 +0800399static void gen6_3DSTATE_CLEAR_PARAMS(struct intel_cmd *cmd,
400 uint32_t clear_val)
401{
402 const uint8_t cmd_len = 2;
Chia-I Wu426072d2014-08-26 14:31:55 +0800403 const uint32_t dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_CLEAR_PARAMS) |
Chia-I Wuf8231032014-08-25 10:44:45 +0800404 GEN6_CLEAR_PARAMS_DW0_VALID |
405 (cmd_len - 2);
406
407 CMD_ASSERT(cmd, 6, 6);
408
409 cmd_batch_reserve(cmd, cmd_len);
410 cmd_batch_write(cmd, dw0);
411 cmd_batch_write(cmd, clear_val);
412}
413
/*
 * Write a 3-dword 3DSTATE_CLEAR_PARAMS command (asserted for GEN7 to
 * GEN7.5).  DW1 is the clear value and DW2 is the constant 1 (presumably
 * the valid bit, which on GEN6 lives in DW0 -- confirm against the PRM).
 */
static void gen7_3DSTATE_CLEAR_PARAMS(struct intel_cmd *cmd,
                                      uint32_t clear_val)
{
    const uint8_t cmd_len = 3;
    uint32_t header;

    CMD_ASSERT(cmd, 7, 7.5);

    header = GEN7_RENDER_CMD(3D, 3DSTATE_CLEAR_PARAMS) | (cmd_len - 2);

    cmd_batch_reserve(cmd, cmd_len);
    cmd_batch_write(cmd, header);
    cmd_batch_write(cmd, clear_val);
    cmd_batch_write(cmd, 1);
}
428
Chia-I Wu302742d2014-08-22 10:28:29 +0800429static void gen6_3DSTATE_CC_STATE_POINTERS(struct intel_cmd *cmd,
430 XGL_UINT blend_pos,
431 XGL_UINT ds_pos,
432 XGL_UINT cc_pos)
433{
434 const uint8_t cmd_len = 4;
435 uint32_t dw0;
436
437 CMD_ASSERT(cmd, 6, 6);
438
Chia-I Wu426072d2014-08-26 14:31:55 +0800439 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_CC_STATE_POINTERS) |
Chia-I Wu302742d2014-08-22 10:28:29 +0800440 (cmd_len - 2);
441
442 cmd_batch_reserve(cmd, cmd_len);
443 cmd_batch_write(cmd, dw0);
444 cmd_batch_write(cmd, (blend_pos << 2) | 1);
445 cmd_batch_write(cmd, (ds_pos << 2) | 1);
446 cmd_batch_write(cmd, (cc_pos << 2) | 1);
447}
448
Chia-I Wu1744cca2014-08-22 11:10:17 +0800449static void gen6_3DSTATE_VIEWPORT_STATE_POINTERS(struct intel_cmd *cmd,
450 XGL_UINT clip_pos,
451 XGL_UINT sf_pos,
452 XGL_UINT cc_pos)
453{
454 const uint8_t cmd_len = 4;
455 uint32_t dw0;
456
457 CMD_ASSERT(cmd, 6, 6);
458
Chia-I Wu426072d2014-08-26 14:31:55 +0800459 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_VIEWPORT_STATE_POINTERS) |
Chia-I Wu1744cca2014-08-22 11:10:17 +0800460 GEN6_PTR_VP_DW0_CLIP_CHANGED |
461 GEN6_PTR_VP_DW0_SF_CHANGED |
462 GEN6_PTR_VP_DW0_CC_CHANGED |
463 (cmd_len - 2);
464
465 cmd_batch_reserve(cmd, cmd_len);
466 cmd_batch_write(cmd, dw0);
467 cmd_batch_write(cmd, clip_pos << 2);
468 cmd_batch_write(cmd, sf_pos << 2);
469 cmd_batch_write(cmd, cc_pos << 2);
470}
471
472static void gen6_3DSTATE_SCISSOR_STATE_POINTERS(struct intel_cmd *cmd,
473 XGL_UINT scissor_pos)
474{
475 const uint8_t cmd_len = 2;
476 uint32_t dw0;
477
478 CMD_ASSERT(cmd, 6, 6);
479
Chia-I Wu426072d2014-08-26 14:31:55 +0800480 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_SCISSOR_STATE_POINTERS) |
Chia-I Wu1744cca2014-08-22 11:10:17 +0800481 (cmd_len - 2);
482
483 cmd_batch_reserve(cmd, cmd_len);
484 cmd_batch_write(cmd, dw0);
485 cmd_batch_write(cmd, scissor_pos << 2);
486}
487
Chia-I Wu42a56202014-08-23 16:47:48 +0800488static void gen6_3DSTATE_BINDING_TABLE_POINTERS(struct intel_cmd *cmd,
489 XGL_UINT vs_pos,
490 XGL_UINT gs_pos,
491 XGL_UINT ps_pos)
492{
493 const uint8_t cmd_len = 4;
494 uint32_t dw0;
495
496 CMD_ASSERT(cmd, 6, 6);
497
Chia-I Wu426072d2014-08-26 14:31:55 +0800498 dw0 = GEN6_RENDER_CMD(3D, 3DSTATE_BINDING_TABLE_POINTERS) |
Chia-I Wu42a56202014-08-23 16:47:48 +0800499 GEN6_PTR_BINDING_TABLE_DW0_VS_CHANGED |
500 GEN6_PTR_BINDING_TABLE_DW0_GS_CHANGED |
501 GEN6_PTR_BINDING_TABLE_DW0_PS_CHANGED |
502 (cmd_len - 2);
503
504 cmd_batch_reserve(cmd, cmd_len);
505 cmd_batch_write(cmd, dw0);
506 cmd_batch_write(cmd, vs_pos << 2);
507 cmd_batch_write(cmd, gs_pos << 2);
508 cmd_batch_write(cmd, ps_pos << 2);
509}
510
Chia-I Wu302742d2014-08-22 10:28:29 +0800511static void gen7_3dstate_pointer(struct intel_cmd *cmd,
512 int subop, XGL_UINT pos)
513{
514 const uint8_t cmd_len = 2;
515 const uint32_t dw0 = GEN6_RENDER_TYPE_RENDER |
516 GEN6_RENDER_SUBTYPE_3D |
517 subop | (cmd_len - 2);
518
519 cmd_batch_reserve(cmd, cmd_len);
520 cmd_batch_write(cmd, dw0);
521 cmd_batch_write(cmd, pos << 2);
522}
523
524static XGL_UINT gen6_BLEND_STATE(struct intel_cmd *cmd,
525 const struct intel_blend_state *state)
526{
527 const uint8_t cmd_align = GEN6_ALIGNMENT_BLEND_STATE;
528 const uint8_t cmd_len = XGL_MAX_COLOR_ATTACHMENTS * 2;
529
530 CMD_ASSERT(cmd, 6, 7.5);
531 STATIC_ASSERT(ARRAY_SIZE(state->cmd) >= cmd_len);
532
533 return cmd_state_copy(cmd, state->cmd, cmd_len, cmd_align);
534}
535
536static XGL_UINT gen6_DEPTH_STENCIL_STATE(struct intel_cmd *cmd,
537 const struct intel_ds_state *state)
538{
539 const uint8_t cmd_align = GEN6_ALIGNMENT_DEPTH_STENCIL_STATE;
540 const uint8_t cmd_len = 3;
541
542 CMD_ASSERT(cmd, 6, 7.5);
543 STATIC_ASSERT(ARRAY_SIZE(state->cmd) >= cmd_len);
544
545 return cmd_state_copy(cmd, state->cmd, cmd_len, cmd_align);
546}
547
548static XGL_UINT gen6_COLOR_CALC_STATE(struct intel_cmd *cmd,
549 uint32_t stencil_ref,
550 const uint32_t blend_color[4])
551{
552 const uint8_t cmd_align = GEN6_ALIGNMENT_COLOR_CALC_STATE;
553 const uint8_t cmd_len = 6;
554 XGL_UINT pos;
555 uint32_t *dw;
556
557 CMD_ASSERT(cmd, 6, 7.5);
558
559 dw = cmd_state_reserve(cmd, cmd_len, cmd_align, &pos);
560 dw[0] = stencil_ref;
561 dw[1] = 0;
562 dw[2] = blend_color[0];
563 dw[3] = blend_color[1];
564 dw[4] = blend_color[2];
565 dw[5] = blend_color[3];
566 cmd_state_advance(cmd, cmd_len);
567
568 return pos;
569}
570
Chia-I Wu48c283d2014-08-25 23:13:46 +0800571static void gen6_wa_post_sync_flush(struct intel_cmd *cmd)
572{
Chia-I Wu707a29e2014-08-27 12:51:47 +0800573 if (!cmd->bind.draw_count)
574 return;
575
Chia-I Wu48c283d2014-08-25 23:13:46 +0800576 if (cmd->bind.wa_flags & GEN6_WA_POST_SYNC_FLUSH)
577 return;
578
579 CMD_ASSERT(cmd, 6, 7.5);
580
581 cmd->bind.wa_flags |= GEN6_WA_POST_SYNC_FLUSH;
582
583 /*
584 * From the Sandy Bridge PRM, volume 2 part 1, page 60:
585 *
586 * "Pipe-control with CS-stall bit set must be sent BEFORE the
587 * pipe-control with a post-sync op and no write-cache flushes."
588 *
589 * The workaround below necessitates this workaround.
590 */
591 gen6_PIPE_CONTROL(cmd,
592 GEN6_PIPE_CONTROL_CS_STALL |
593 GEN6_PIPE_CONTROL_PIXEL_SCOREBOARD_STALL,
594 NULL, 0);
595
596 /*
597 * From the Sandy Bridge PRM, volume 2 part 1, page 60:
598 *
599 * "Before any depth stall flush (including those produced by
600 * non-pipelined state commands), software needs to first send a
601 * PIPE_CONTROL with no bits set except Post-Sync Operation != 0."
602 *
603 * "Before a PIPE_CONTROL with Write Cache Flush Enable =1, a
604 * PIPE_CONTROL with any non-zero post-sync-op is required."
605 */
606 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_WRITE_IMM, cmd->scratch_bo, 0);
607}
608
Courtney Goeltzenleuchterf9e1a412014-08-27 13:59:36 -0600609static void gen6_wa_wm_multisample_flush(struct intel_cmd *cmd)
610{
611 CMD_ASSERT(cmd, 6, 6);
612
613 gen6_wa_post_sync_flush(cmd);
614
615 /*
616 * From the Sandy Bridge PRM, volume 2 part 1, page 305:
617 *
618 * "Driver must guarentee that all the caches in the depth pipe are
619 * flushed before this command (3DSTATE_MULTISAMPLE) is parsed. This
620 * requires driver to send a PIPE_CONTROL with a CS stall along with a
621 * Depth Flush prior to this command."
622 */
623 gen6_PIPE_CONTROL(cmd,
624 GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH |
625 GEN6_PIPE_CONTROL_CS_STALL,
626 0, 0);
627}
628
Chia-I Wu48c283d2014-08-25 23:13:46 +0800629static void gen6_wa_ds_flush(struct intel_cmd *cmd)
630{
Chia-I Wu707a29e2014-08-27 12:51:47 +0800631 if (!cmd->bind.draw_count)
632 return;
633
Chia-I Wu48c283d2014-08-25 23:13:46 +0800634 if (cmd->bind.wa_flags & GEN6_WA_DS_FLUSH)
635 return;
636
637 CMD_ASSERT(cmd, 6, 7.5);
638
639 cmd->bind.wa_flags |= GEN6_WA_DS_FLUSH;
640
641 gen6_wa_post_sync_flush(cmd);
642
643 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_DEPTH_STALL, NULL, 0);
644 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH, NULL, 0);
645 gen6_PIPE_CONTROL(cmd, GEN6_PIPE_CONTROL_DEPTH_STALL, NULL, 0);
646}
647
Chia-I Wu525c6602014-08-27 10:22:34 +0800648void cmd_batch_flush(struct intel_cmd *cmd, uint32_t pipe_control_dw0)
649{
650 if (!cmd->bind.draw_count)
651 return;
652
653 assert(!(pipe_control_dw0 & GEN6_PIPE_CONTROL_WRITE__MASK));
654
655 if (pipe_control_dw0 & GEN6_PIPE_CONTROL_RENDER_CACHE_FLUSH)
656 gen6_wa_post_sync_flush(cmd);
657
658 gen6_PIPE_CONTROL(cmd, pipe_control_dw0, NULL, 0);
659}
660
Chia-I Wu302742d2014-08-22 10:28:29 +0800661static void gen6_cc_states(struct intel_cmd *cmd)
662{
663 const struct intel_blend_state *blend = cmd->bind.state.blend;
664 const struct intel_ds_state *ds = cmd->bind.state.ds;
665 XGL_UINT blend_pos, ds_pos, cc_pos;
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800666 uint32_t stencil_ref;
667 uint32_t blend_color[4];
Chia-I Wu302742d2014-08-22 10:28:29 +0800668
669 CMD_ASSERT(cmd, 6, 6);
670
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800671 if (blend) {
672 blend_pos = gen6_BLEND_STATE(cmd, blend);
673 memcpy(blend_color, blend->cmd_blend_color, sizeof(blend_color));
674 } else {
675 blend_pos = 0;
676 memset(blend_color, 0, sizeof(blend_color));
677 }
678
679 if (ds) {
680 ds_pos = gen6_DEPTH_STENCIL_STATE(cmd, ds);
681 stencil_ref = ds->cmd_stencil_ref;
682 } else {
683 ds_pos = 0;
684 stencil_ref = 0;
685 }
686
687 cc_pos = gen6_COLOR_CALC_STATE(cmd, stencil_ref, blend_color);
Chia-I Wu302742d2014-08-22 10:28:29 +0800688
689 gen6_3DSTATE_CC_STATE_POINTERS(cmd, blend_pos, ds_pos, cc_pos);
690}
691
Chia-I Wu1744cca2014-08-22 11:10:17 +0800692static void gen6_viewport_states(struct intel_cmd *cmd)
693{
694 const struct intel_viewport_state *viewport = cmd->bind.state.viewport;
695 XGL_UINT pos;
696
697 if (!viewport)
698 return;
699
700 pos = cmd_state_copy(cmd, viewport->cmd, viewport->cmd_len,
701 viewport->cmd_align);
702
703 gen6_3DSTATE_VIEWPORT_STATE_POINTERS(cmd,
704 pos + viewport->cmd_clip_offset,
705 pos,
706 pos + viewport->cmd_cc_offset);
707
708 pos = (viewport->scissor_enable) ?
709 pos + viewport->cmd_scissor_rect_offset : 0;
710
711 gen6_3DSTATE_SCISSOR_STATE_POINTERS(cmd, pos);
712}
713
Chia-I Wu302742d2014-08-22 10:28:29 +0800714static void gen7_cc_states(struct intel_cmd *cmd)
715{
716 const struct intel_blend_state *blend = cmd->bind.state.blend;
717 const struct intel_ds_state *ds = cmd->bind.state.ds;
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800718 uint32_t stencil_ref;
719 uint32_t blend_color[4];
Chia-I Wu302742d2014-08-22 10:28:29 +0800720 XGL_UINT pos;
721
722 CMD_ASSERT(cmd, 7, 7.5);
723
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800724 if (!blend && !ds)
725 return;
Chia-I Wu302742d2014-08-22 10:28:29 +0800726
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800727 if (blend) {
728 pos = gen6_BLEND_STATE(cmd, blend);
729 gen7_3dstate_pointer(cmd,
730 GEN7_RENDER_OPCODE_3DSTATE_BLEND_STATE_POINTERS, pos);
Chia-I Wu302742d2014-08-22 10:28:29 +0800731
Chia-I Wuce9f11f2014-08-22 10:38:51 +0800732 memcpy(blend_color, blend->cmd_blend_color, sizeof(blend_color));
733 } else {
734 memset(blend_color, 0, sizeof(blend_color));
735 }
736
737 if (ds) {
738 pos = gen6_DEPTH_STENCIL_STATE(cmd, ds);
739 gen7_3dstate_pointer(cmd,
740 GEN7_RENDER_OPCODE_3DSTATE_DEPTH_STENCIL_STATE_POINTERS, pos);
741 } else {
742 stencil_ref = 0;
743 }
744
745 pos = gen6_COLOR_CALC_STATE(cmd, stencil_ref, blend_color);
Chia-I Wu302742d2014-08-22 10:28:29 +0800746 gen7_3dstate_pointer(cmd,
747 GEN6_RENDER_OPCODE_3DSTATE_CC_STATE_POINTERS, pos);
748}
749
Chia-I Wu1744cca2014-08-22 11:10:17 +0800750static void gen7_viewport_states(struct intel_cmd *cmd)
751{
752 const struct intel_viewport_state *viewport = cmd->bind.state.viewport;
753 XGL_UINT pos;
754
755 if (!viewport)
756 return;
757
758 pos = cmd_state_copy(cmd, viewport->cmd, viewport->cmd_len,
759 viewport->cmd_align);
760
761 gen7_3dstate_pointer(cmd,
762 GEN7_RENDER_OPCODE_3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP, pos);
763 gen7_3dstate_pointer(cmd,
764 GEN7_RENDER_OPCODE_3DSTATE_VIEWPORT_STATE_POINTERS_CC,
765 pos + viewport->cmd_cc_offset);
766 if (viewport->scissor_enable) {
767 gen7_3dstate_pointer(cmd,
768 GEN6_RENDER_OPCODE_3DSTATE_SCISSOR_STATE_POINTERS,
769 pos + viewport->cmd_scissor_rect_offset);
770 }
771}
772
Chia-I Wu7fd5cac2014-08-27 13:19:29 +0800773static void gen6_pcb(struct intel_cmd *cmd, int subop,
774 const XGL_PIPELINE_SHADER *sh)
775{
776 const uint8_t cmd_len = 5;
777 const XGL_UINT alignment = 32;
778 const XGL_UINT max_size =
779 (subop == GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_VS) ? 1024 : 2048;
780 const XGL_UINT max_pcb = 4;
781 uint32_t pcb[4] = { 0, 0, 0, 0 };
782 XGL_FLAGS pcb_enables = 0;
783 XGL_SIZE total_size = 0;
784 uint32_t dw0;
785 XGL_UINT i;
786
787 for (i = 0; i < sh->linkConstBufferCount; i++) {
788 const XGL_LINK_CONST_BUFFER *info = &sh->pLinkConstBufferInfo[i];
789 const XGL_SIZE size = u_align(info->bufferSize, alignment);
790 void *ptr;
791
792 if (info->bufferId >= max_pcb ||
793 pcb_enables & ((1 << info->bufferId)) ||
794 total_size + info->bufferSize > max_size) {
795 cmd->result = XGL_ERROR_UNKNOWN;
796 return;
797 }
798 if (!size)
799 continue;
800
801 pcb_enables |= 1 << info->bufferId;
802 total_size += size;
803
804 ptr = cmd_state_reserve(cmd, size / sizeof(uint32_t),
805 alignment / sizeof(uint32_t), &pcb[info->bufferId]);
806 memcpy(ptr, info->pBufferData, info->bufferSize);
807 cmd_state_advance(cmd, size / sizeof(uint32_t));
808
809 pcb[info->bufferId] |= size / alignment - 1;
810 }
811
812 dw0 = GEN6_RENDER_TYPE_RENDER |
813 GEN6_RENDER_SUBTYPE_3D |
814 subop |
815 pcb_enables << 12 |
816 (cmd_len - 2);
817
818 cmd_batch_reserve(cmd, cmd_len);
819 cmd_batch_write(cmd, dw0);
820 cmd_batch_write(cmd, pcb[0]);
821 cmd_batch_write(cmd, pcb[1]);
822 cmd_batch_write(cmd, pcb[2]);
823 cmd_batch_write(cmd, pcb[3]);
824}
825
826static void gen7_pcb(struct intel_cmd *cmd, int subop,
827 const XGL_PIPELINE_SHADER *sh)
828{
829 const uint8_t cmd_len = 7;
830 const uint32_t dw0 = GEN6_RENDER_TYPE_RENDER |
831 GEN6_RENDER_SUBTYPE_3D |
832 subop |
833 (cmd_len - 2);
834 const XGL_UINT alignment = 32;
835 const XGL_UINT max_size = 2048;
836 const XGL_UINT max_pcb = 4;
837 uint16_t pcb_len[4] = { 0, 0, 0, 0 };
838 uint32_t pcb[4] = { 0, 0, 0, 0 };
839 XGL_FLAGS pcb_enables = 0;
840 XGL_SIZE total_size = 0;
841 XGL_UINT i;
842
843 for (i = 0; i < sh->linkConstBufferCount; i++) {
844 const XGL_LINK_CONST_BUFFER *info = &sh->pLinkConstBufferInfo[i];
845 const XGL_SIZE size = u_align(info->bufferSize, alignment);
846 void *ptr;
847
848 if (info->bufferId >= max_pcb ||
849 pcb_enables & ((1 << info->bufferId)) ||
850 total_size + info->bufferSize > max_size) {
851 cmd->result = XGL_ERROR_UNKNOWN;
852 return;
853 }
854 if (!size)
855 continue;
856
857 pcb_enables |= 1 << info->bufferId;
858 total_size += size;
859
860 pcb_len[info->bufferId] = size / alignment;
861
862 ptr = cmd_state_reserve(cmd, size / sizeof(uint32_t),
863 alignment / sizeof(uint32_t), &pcb[info->bufferId]);
864 memcpy(ptr, info->pBufferData, info->bufferSize);
865 cmd_state_advance(cmd, size / sizeof(uint32_t));
866 }
867
868 /* no holes */
869 if (!u_is_pow2(pcb_enables + 1)) {
870 cmd->result = XGL_ERROR_UNKNOWN;
871 return;
872 }
873
874 cmd_batch_reserve(cmd, cmd_len);
875 cmd_batch_write(cmd, dw0);
876 cmd_batch_write(cmd, pcb_len[1] << 16 | pcb_len[0]);
877 cmd_batch_write(cmd, pcb_len[3] << 16 | pcb_len[2]);
878 cmd_batch_write(cmd, pcb[0]);
879 cmd_batch_write(cmd, pcb[1]);
880 cmd_batch_write(cmd, pcb[2]);
881 cmd_batch_write(cmd, pcb[3]);
882}
883
Chia-I Wu42a56202014-08-23 16:47:48 +0800884static void emit_ps_resources(struct intel_cmd *cmd,
885 const struct intel_rmap *rmap)
886{
887 const XGL_UINT surface_count = rmap->rt_count +
888 rmap->resource_count + rmap->uav_count;
889 uint32_t binding_table[256];
890 XGL_UINT pos, i;
891
892 assert(surface_count <= ARRAY_SIZE(binding_table));
893
894 for (i = 0; i < surface_count; i++) {
895 const struct intel_rmap_slot *slot = &rmap->slots[i];
896 uint32_t *dw;
897
898 switch (slot->path_len) {
899 case 0:
900 pos = 0;
901 break;
902 case INTEL_RMAP_SLOT_RT:
903 {
904 const struct intel_rt_view *view = cmd->bind.att.rt[i];
905
906 dw = cmd_state_reserve_reloc(cmd, view->cmd_len, 1,
907 GEN6_ALIGNMENT_SURFACE_STATE, &pos);
908
909 memcpy(dw, view->cmd, sizeof(uint32_t) * view->cmd_len);
Chia-I Wubda55fd2014-08-25 12:46:10 +0800910 cmd_state_reloc(cmd, 1, view->cmd[1], view->img->obj.mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800911 INTEL_RELOC_WRITE);
Chia-I Wu42a56202014-08-23 16:47:48 +0800912 cmd_state_advance(cmd, view->cmd_len);
913 }
914 break;
915 case INTEL_RMAP_SLOT_DYN:
916 {
917 const struct intel_mem_view *view =
Chia-I Wu9f1722c2014-08-25 10:17:58 +0800918 &cmd->bind.dyn_view.graphics;
Chia-I Wu42a56202014-08-23 16:47:48 +0800919
920 dw = cmd_state_reserve_reloc(cmd, view->cmd_len, 1,
921 GEN6_ALIGNMENT_SURFACE_STATE, &pos);
922
923 memcpy(dw, view->cmd, sizeof(uint32_t) * view->cmd_len);
Chia-I Wubda55fd2014-08-25 12:46:10 +0800924 cmd_state_reloc(cmd, 1, view->cmd[1], view->mem->bo,
Chia-I Wu32a22462014-08-26 14:13:46 +0800925 INTEL_RELOC_WRITE);
Chia-I Wu42a56202014-08-23 16:47:48 +0800926 cmd_state_advance(cmd, view->cmd_len);
927 }
928 break;
929 case 1:
930 default:
931 /* TODO */
932 assert(!"no dset support");
933 break;
934 }
935
936 binding_table[i] = pos << 2;
937 }
938
939 pos = cmd_state_copy(cmd, binding_table, surface_count,
940 GEN6_ALIGNMENT_BINDING_TABLE_STATE);
941
942 if (cmd_gen(cmd) >= INTEL_GEN(7)) {
943 gen7_3dstate_pointer(cmd,
944 GEN7_RENDER_OPCODE_3DSTATE_BINDING_TABLE_POINTERS_PS, pos);
945 } else {
946 gen6_3DSTATE_BINDING_TABLE_POINTERS(cmd, 0, 0, pos);
947 }
948}
949
Chia-I Wu52500102014-08-22 00:46:04 +0800950static void emit_bounded_states(struct intel_cmd *cmd)
951{
952 const struct intel_msaa_state *msaa = cmd->bind.state.msaa;
953
954 /* TODO more states */
955
Chia-I Wu1744cca2014-08-22 11:10:17 +0800956 if (cmd_gen(cmd) >= INTEL_GEN(7)) {
Chia-I Wu302742d2014-08-22 10:28:29 +0800957 gen7_cc_states(cmd);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800958 gen7_viewport_states(cmd);
Chia-I Wu7fd5cac2014-08-27 13:19:29 +0800959
960 gen7_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_VS,
961 &cmd->bind.pipeline.graphics->vs);
962 gen7_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_PS,
963 &cmd->bind.pipeline.graphics->fs);
Courtney Goeltzenleuchterf9e1a412014-08-27 13:59:36 -0600964 // TODO: URB
Chia-I Wu1744cca2014-08-22 11:10:17 +0800965 } else {
Courtney Goeltzenleuchterf9e1a412014-08-27 13:59:36 -0600966 /* need multisample flush on gen6 */
967 gen6_wa_wm_multisample_flush(cmd);
Chia-I Wu302742d2014-08-22 10:28:29 +0800968 gen6_cc_states(cmd);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800969 gen6_viewport_states(cmd);
Chia-I Wu7fd5cac2014-08-27 13:19:29 +0800970
971 gen6_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_VS,
972 &cmd->bind.pipeline.graphics->vs);
973 gen6_pcb(cmd, GEN6_RENDER_OPCODE_3DSTATE_CONSTANT_PS,
974 &cmd->bind.pipeline.graphics->fs);
Chia-I Wu1744cca2014-08-22 11:10:17 +0800975 }
Chia-I Wu302742d2014-08-22 10:28:29 +0800976
Chia-I Wu42a56202014-08-23 16:47:48 +0800977 emit_ps_resources(cmd, cmd->bind.pipeline.graphics->fs_rmap);
978
Chia-I Wu52500102014-08-22 00:46:04 +0800979 /* 3DSTATE_MULTISAMPLE and 3DSTATE_SAMPLE_MASK */
Chia-I Wu48c283d2014-08-25 23:13:46 +0800980 gen6_wa_post_sync_flush(cmd);
Chia-I Wu52500102014-08-22 00:46:04 +0800981 cmd_batch_reserve(cmd, msaa->cmd_len);
982 cmd_batch_write_n(cmd, msaa->cmd, msaa->cmd_len);
983}
984
Chia-I Wu9f1722c2014-08-25 10:17:58 +0800985static void cmd_bind_graphics_pipeline(struct intel_cmd *cmd,
986 const struct intel_pipeline *pipeline)
987{
988 cmd->bind.pipeline.graphics = pipeline;
989}
990
991static void cmd_bind_compute_pipeline(struct intel_cmd *cmd,
992 const struct intel_pipeline *pipeline)
993{
994 cmd->bind.pipeline.compute = pipeline;
995}
996
997static void cmd_bind_graphics_delta(struct intel_cmd *cmd,
998 const struct intel_pipeline_delta *delta)
999{
1000 cmd->bind.pipeline.graphics_delta = delta;
1001}
1002
1003static void cmd_bind_compute_delta(struct intel_cmd *cmd,
1004 const struct intel_pipeline_delta *delta)
1005{
1006 cmd->bind.pipeline.compute_delta = delta;
1007}
1008
1009static void cmd_bind_graphics_dset(struct intel_cmd *cmd,
1010 const struct intel_dset *dset,
1011 XGL_UINT slot_offset)
1012{
1013 cmd->bind.dset.graphics = dset;
1014 cmd->bind.dset.graphics_offset = slot_offset;
1015}
1016
1017static void cmd_bind_compute_dset(struct intel_cmd *cmd,
1018 const struct intel_dset *dset,
1019 XGL_UINT slot_offset)
1020{
1021 cmd->bind.dset.compute = dset;
1022 cmd->bind.dset.compute_offset = slot_offset;
1023}
1024
1025static void cmd_bind_graphics_dyn_view(struct intel_cmd *cmd,
1026 const XGL_MEMORY_VIEW_ATTACH_INFO *info)
1027{
1028 intel_mem_view_init(&cmd->bind.dyn_view.graphics, cmd->dev, info);
1029}
1030
1031static void cmd_bind_compute_dyn_view(struct intel_cmd *cmd,
1032 const XGL_MEMORY_VIEW_ATTACH_INFO *info)
1033{
1034 intel_mem_view_init(&cmd->bind.dyn_view.compute, cmd->dev, info);
1035}
1036
1037static void cmd_bind_index_data(struct intel_cmd *cmd,
1038 const struct intel_mem *mem,
1039 XGL_GPU_SIZE offset, XGL_INDEX_TYPE type)
1040{
1041 if (cmd_gen(cmd) >= INTEL_GEN(7.5)) {
1042 gen6_3DSTATE_INDEX_BUFFER(cmd, mem, offset, type, false);
1043 } else {
1044 cmd->bind.index.mem = mem;
1045 cmd->bind.index.offset = offset;
1046 cmd->bind.index.type = type;
1047 }
1048}
1049
1050static void cmd_bind_rt(struct intel_cmd *cmd,
1051 const XGL_COLOR_ATTACHMENT_BIND_INFO *attachments,
1052 XGL_UINT count)
1053{
Chia-I Wud88e02d2014-08-25 10:56:13 +08001054 XGL_UINT width = 0, height = 0;
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001055 XGL_UINT i;
1056
1057 for (i = 0; i < count; i++) {
1058 const XGL_COLOR_ATTACHMENT_BIND_INFO *att = &attachments[i];
1059 const struct intel_rt_view *rt = intel_rt_view(att->view);
Chia-I Wud88e02d2014-08-25 10:56:13 +08001060 const struct intel_layout *layout = &rt->img->layout;
1061
1062 if (i == 0) {
1063 width = layout->width0;
1064 height = layout->height0;
1065 } else {
1066 if (width > layout->width0)
1067 width = layout->width0;
1068 if (height > layout->height0)
1069 height = layout->height0;
1070 }
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001071
1072 cmd->bind.att.rt[i] = rt;
1073 }
1074
1075 cmd->bind.att.rt_count = count;
Chia-I Wud88e02d2014-08-25 10:56:13 +08001076
Chia-I Wu48c283d2014-08-25 23:13:46 +08001077 gen6_wa_post_sync_flush(cmd);
Chia-I Wud88e02d2014-08-25 10:56:13 +08001078 gen6_3DSTATE_DRAWING_RECTANGLE(cmd, width, height);
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001079}
1080
1081static void cmd_bind_ds(struct intel_cmd *cmd,
1082 const XGL_DEPTH_STENCIL_BIND_INFO *info)
1083{
1084 const struct intel_ds_view *ds;
1085
1086 if (info) {
1087 cmd->bind.att.ds = intel_ds_view(info->view);
1088 ds = cmd->bind.att.ds;
1089 } else {
1090 /* all zeros */
1091 static const struct intel_ds_view null_ds;
1092 ds = &null_ds;
1093 }
1094
Chia-I Wu48c283d2014-08-25 23:13:46 +08001095 gen6_wa_ds_flush(cmd);
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001096 gen6_3DSTATE_DEPTH_BUFFER(cmd, ds);
1097 gen6_3DSTATE_STENCIL_BUFFER(cmd, ds);
1098 gen6_3DSTATE_HIER_DEPTH_BUFFER(cmd, ds);
Chia-I Wuf8231032014-08-25 10:44:45 +08001099
1100 if (cmd_gen(cmd) >= INTEL_GEN(7))
1101 gen7_3DSTATE_CLEAR_PARAMS(cmd, 0);
1102 else
1103 gen6_3DSTATE_CLEAR_PARAMS(cmd, 0);
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001104}
1105
1106static void cmd_bind_viewport_state(struct intel_cmd *cmd,
1107 const struct intel_viewport_state *state)
1108{
1109 cmd->bind.state.viewport = state;
1110}
1111
1112static void cmd_bind_raster_state(struct intel_cmd *cmd,
1113 const struct intel_raster_state *state)
1114{
1115 cmd->bind.state.raster = state;
1116}
1117
1118static void cmd_bind_ds_state(struct intel_cmd *cmd,
1119 const struct intel_ds_state *state)
1120{
1121 cmd->bind.state.ds = state;
1122}
1123
1124static void cmd_bind_blend_state(struct intel_cmd *cmd,
1125 const struct intel_blend_state *state)
1126{
1127 cmd->bind.state.blend = state;
1128}
1129
1130static void cmd_bind_msaa_state(struct intel_cmd *cmd,
1131 const struct intel_msaa_state *state)
1132{
1133 cmd->bind.state.msaa = state;
1134}
1135
1136static void cmd_draw(struct intel_cmd *cmd,
1137 XGL_UINT vertex_start,
1138 XGL_UINT vertex_count,
1139 XGL_UINT instance_start,
1140 XGL_UINT instance_count,
1141 bool indexed,
1142 XGL_UINT vertex_base)
1143{
1144 const struct intel_pipeline *p = cmd->bind.pipeline.graphics;
1145
1146 emit_bounded_states(cmd);
1147
1148 if (indexed) {
1149 if (p->primitive_restart && !gen6_can_primitive_restart(cmd))
1150 cmd->result = XGL_ERROR_UNKNOWN;
1151
1152 if (cmd_gen(cmd) >= INTEL_GEN(7.5)) {
1153 gen75_3DSTATE_VF(cmd, p->primitive_restart,
1154 p->primitive_restart_index);
1155 } else {
1156 gen6_3DSTATE_INDEX_BUFFER(cmd, cmd->bind.index.mem,
1157 cmd->bind.index.offset, cmd->bind.index.type,
1158 p->primitive_restart);
1159 }
1160 } else {
1161 assert(!vertex_base);
1162 }
1163
1164 if (cmd_gen(cmd) >= INTEL_GEN(7)) {
1165 gen7_3DPRIMITIVE(cmd, p->prim_type, indexed, vertex_count,
1166 vertex_start, instance_count, instance_start, vertex_base);
1167 } else {
1168 gen6_3DPRIMITIVE(cmd, p->prim_type, indexed, vertex_count,
1169 vertex_start, instance_count, instance_start, vertex_base);
1170 }
Chia-I Wu48c283d2014-08-25 23:13:46 +08001171
Chia-I Wu707a29e2014-08-27 12:51:47 +08001172 cmd->bind.draw_count++;
Chia-I Wu48c283d2014-08-25 23:13:46 +08001173 /* need to re-emit all workarounds */
1174 cmd->bind.wa_flags = 0;
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001175}
1176
Chia-I Wub2755562014-08-20 13:38:52 +08001177XGL_VOID XGLAPI intelCmdBindPipeline(
1178 XGL_CMD_BUFFER cmdBuffer,
1179 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1180 XGL_PIPELINE pipeline)
1181{
1182 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1183
1184 switch (pipelineBindPoint) {
1185 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001186 cmd_bind_compute_pipeline(cmd, intel_pipeline(pipeline));
Chia-I Wub2755562014-08-20 13:38:52 +08001187 break;
1188 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001189 cmd_bind_graphics_pipeline(cmd, intel_pipeline(pipeline));
Chia-I Wub2755562014-08-20 13:38:52 +08001190 break;
1191 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001192 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001193 break;
1194 }
1195}
1196
1197XGL_VOID XGLAPI intelCmdBindPipelineDelta(
1198 XGL_CMD_BUFFER cmdBuffer,
1199 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1200 XGL_PIPELINE_DELTA delta)
1201{
1202 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1203
1204 switch (pipelineBindPoint) {
1205 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001206 cmd_bind_compute_delta(cmd, delta);
Chia-I Wub2755562014-08-20 13:38:52 +08001207 break;
1208 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001209 cmd_bind_graphics_delta(cmd, delta);
Chia-I Wub2755562014-08-20 13:38:52 +08001210 break;
1211 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001212 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001213 break;
1214 }
1215}
1216
1217XGL_VOID XGLAPI intelCmdBindStateObject(
1218 XGL_CMD_BUFFER cmdBuffer,
1219 XGL_STATE_BIND_POINT stateBindPoint,
1220 XGL_STATE_OBJECT state)
1221{
1222 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1223
1224 switch (stateBindPoint) {
1225 case XGL_STATE_BIND_VIEWPORT:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001226 cmd_bind_viewport_state(cmd,
1227 intel_viewport_state((XGL_VIEWPORT_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001228 break;
1229 case XGL_STATE_BIND_RASTER:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001230 cmd_bind_raster_state(cmd,
1231 intel_raster_state((XGL_RASTER_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001232 break;
1233 case XGL_STATE_BIND_DEPTH_STENCIL:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001234 cmd_bind_ds_state(cmd,
1235 intel_ds_state((XGL_DEPTH_STENCIL_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001236 break;
1237 case XGL_STATE_BIND_COLOR_BLEND:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001238 cmd_bind_blend_state(cmd,
1239 intel_blend_state((XGL_COLOR_BLEND_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001240 break;
1241 case XGL_STATE_BIND_MSAA:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001242 cmd_bind_msaa_state(cmd,
1243 intel_msaa_state((XGL_MSAA_STATE_OBJECT) state));
Chia-I Wub2755562014-08-20 13:38:52 +08001244 break;
1245 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001246 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001247 break;
1248 }
1249}
1250
1251XGL_VOID XGLAPI intelCmdBindDescriptorSet(
1252 XGL_CMD_BUFFER cmdBuffer,
1253 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1254 XGL_UINT index,
1255 XGL_DESCRIPTOR_SET descriptorSet,
1256 XGL_UINT slotOffset)
1257{
1258 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1259 struct intel_dset *dset = intel_dset(descriptorSet);
1260
1261 assert(!index);
1262
1263 switch (pipelineBindPoint) {
1264 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001265 cmd_bind_compute_dset(cmd, dset, slotOffset);
Chia-I Wub2755562014-08-20 13:38:52 +08001266 break;
1267 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001268 cmd_bind_graphics_dset(cmd, dset, slotOffset);
Chia-I Wub2755562014-08-20 13:38:52 +08001269 break;
1270 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001271 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001272 break;
1273 }
1274}
1275
1276XGL_VOID XGLAPI intelCmdBindDynamicMemoryView(
1277 XGL_CMD_BUFFER cmdBuffer,
1278 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
1279 const XGL_MEMORY_VIEW_ATTACH_INFO* pMemView)
1280{
1281 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1282
1283 switch (pipelineBindPoint) {
1284 case XGL_PIPELINE_BIND_POINT_COMPUTE:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001285 cmd_bind_compute_dyn_view(cmd, pMemView);
Chia-I Wub2755562014-08-20 13:38:52 +08001286 break;
1287 case XGL_PIPELINE_BIND_POINT_GRAPHICS:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001288 cmd_bind_graphics_dyn_view(cmd, pMemView);
Chia-I Wub2755562014-08-20 13:38:52 +08001289 break;
1290 default:
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001291 cmd->result = XGL_ERROR_INVALID_VALUE;
Chia-I Wub2755562014-08-20 13:38:52 +08001292 break;
1293 }
1294}
1295
1296XGL_VOID XGLAPI intelCmdBindIndexData(
1297 XGL_CMD_BUFFER cmdBuffer,
1298 XGL_GPU_MEMORY mem_,
1299 XGL_GPU_SIZE offset,
1300 XGL_INDEX_TYPE indexType)
1301{
1302 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1303 struct intel_mem *mem = intel_mem(mem_);
1304
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001305 cmd_bind_index_data(cmd, mem, offset, indexType);
Chia-I Wub2755562014-08-20 13:38:52 +08001306}
1307
1308XGL_VOID XGLAPI intelCmdBindAttachments(
1309 XGL_CMD_BUFFER cmdBuffer,
1310 XGL_UINT colorAttachmentCount,
1311 const XGL_COLOR_ATTACHMENT_BIND_INFO* pColorAttachments,
1312 const XGL_DEPTH_STENCIL_BIND_INFO* pDepthStencilAttachment)
1313{
1314 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
Chia-I Wub2755562014-08-20 13:38:52 +08001315
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001316 cmd_bind_rt(cmd, pColorAttachments, colorAttachmentCount);
1317 cmd_bind_ds(cmd, pDepthStencilAttachment);
Chia-I Wub2755562014-08-20 13:38:52 +08001318}
1319
1320XGL_VOID XGLAPI intelCmdDraw(
1321 XGL_CMD_BUFFER cmdBuffer,
1322 XGL_UINT firstVertex,
1323 XGL_UINT vertexCount,
1324 XGL_UINT firstInstance,
1325 XGL_UINT instanceCount)
1326{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001327 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
Chia-I Wu59c097e2014-08-21 10:51:07 +08001328
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001329 cmd_draw(cmd, firstVertex, vertexCount,
1330 firstInstance, instanceCount, false, 0);
Chia-I Wub2755562014-08-20 13:38:52 +08001331}
1332
1333XGL_VOID XGLAPI intelCmdDrawIndexed(
1334 XGL_CMD_BUFFER cmdBuffer,
1335 XGL_UINT firstIndex,
1336 XGL_UINT indexCount,
1337 XGL_INT vertexOffset,
1338 XGL_UINT firstInstance,
1339 XGL_UINT instanceCount)
1340{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001341 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
Chia-I Wu59c097e2014-08-21 10:51:07 +08001342
Chia-I Wu9f1722c2014-08-25 10:17:58 +08001343 cmd_draw(cmd, firstIndex, indexCount,
1344 firstInstance, instanceCount, true, vertexOffset);
Chia-I Wub2755562014-08-20 13:38:52 +08001345}
1346
1347XGL_VOID XGLAPI intelCmdDrawIndirect(
1348 XGL_CMD_BUFFER cmdBuffer,
1349 XGL_GPU_MEMORY mem,
1350 XGL_GPU_SIZE offset,
1351 XGL_UINT32 count,
1352 XGL_UINT32 stride)
1353{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001354 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1355
1356 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001357}
1358
1359XGL_VOID XGLAPI intelCmdDrawIndexedIndirect(
1360 XGL_CMD_BUFFER cmdBuffer,
1361 XGL_GPU_MEMORY mem,
1362 XGL_GPU_SIZE offset,
1363 XGL_UINT32 count,
1364 XGL_UINT32 stride)
1365{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001366 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1367
1368 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001369}
1370
1371XGL_VOID XGLAPI intelCmdDispatch(
1372 XGL_CMD_BUFFER cmdBuffer,
1373 XGL_UINT x,
1374 XGL_UINT y,
1375 XGL_UINT z)
1376{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001377 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1378
1379 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001380}
1381
1382XGL_VOID XGLAPI intelCmdDispatchIndirect(
1383 XGL_CMD_BUFFER cmdBuffer,
1384 XGL_GPU_MEMORY mem,
1385 XGL_GPU_SIZE offset)
1386{
Chia-I Wu59c097e2014-08-21 10:51:07 +08001387 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
1388
1389 cmd->result = XGL_ERROR_UNKNOWN;
Chia-I Wub2755562014-08-20 13:38:52 +08001390}