blob: c97d4a132998555233a1dca09d544070ca4270dd [file] [log] [blame]
Chia-I Wu09142132014-08-11 15:42:55 +08001/*
2 * XGL
3 *
4 * Copyright (C) 2014 LunarG, Inc.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
23 */
24
Chia-I Wu730e5362014-08-19 12:15:09 +080025#include "genhw/genhw.h"
26#include "kmd/winsys.h"
27#include "dev.h"
Chia-I Wu343b1372014-08-20 16:39:20 +080028#include "mem.h"
Chia-I Wu730e5362014-08-19 12:15:09 +080029#include "obj.h"
Chia-I Wu00a23b22014-08-20 15:28:08 +080030#include "cmd_priv.h"
Chia-I Wu09142132014-08-11 15:42:55 +080031
Chia-I Wue24c3292014-08-21 14:05:23 +080032static XGL_RESULT cmd_writer_alloc_and_map(struct intel_cmd *cmd,
33 struct intel_cmd_writer *writer,
34 XGL_UINT size)
Chia-I Wu730e5362014-08-19 12:15:09 +080035{
36 struct intel_winsys *winsys = cmd->dev->winsys;
Chia-I Wue24c3292014-08-21 14:05:23 +080037 const XGL_GPU_SIZE bo_size = sizeof(uint32_t) * size;
Chia-I Wu730e5362014-08-19 12:15:09 +080038 struct intel_bo *bo;
39 void *ptr;
40
41 bo = intel_winsys_alloc_buffer(winsys,
42 "batch buffer", bo_size, INTEL_DOMAIN_CPU);
43 if (!bo)
44 return XGL_ERROR_OUT_OF_GPU_MEMORY;
45
46 ptr = intel_bo_map(bo, true);
47 if (!bo) {
48 intel_bo_unreference(bo);
49 return XGL_ERROR_MEMORY_MAP_FAILED;
50 }
51
Chia-I Wue24c3292014-08-21 14:05:23 +080052 writer->bo = bo;
53 writer->ptr_opaque = ptr;
54 writer->size = size;
55 writer->used = 0;
Chia-I Wu730e5362014-08-19 12:15:09 +080056
57 return XGL_SUCCESS;
58}
59
Chia-I Wu5e25c272014-08-21 20:19:12 +080060static void cmd_writer_copy(struct intel_cmd *cmd,
61 struct intel_cmd_writer *writer,
62 const uint32_t *vals, XGL_UINT len)
63{
64 assert(writer->used + len <= writer->size);
65 memcpy((uint32_t *) writer->ptr_opaque + writer->used,
66 vals, sizeof(uint32_t) * len);
67 writer->used += len;
68}
69
70static void cmd_writer_patch(struct intel_cmd *cmd,
71 struct intel_cmd_writer *writer,
72 XGL_UINT pos, uint32_t val)
73{
74 assert(pos < writer->used);
75 ((uint32_t *) writer->ptr_opaque)[pos] = val;
76}
77
Chia-I Wue24c3292014-08-21 14:05:23 +080078void cmd_writer_grow(struct intel_cmd *cmd,
79 struct intel_cmd_writer *writer)
Chia-I Wu730e5362014-08-19 12:15:09 +080080{
Chia-I Wue24c3292014-08-21 14:05:23 +080081 const XGL_UINT size = writer->size << 1;
82 const XGL_UINT old_used = writer->used;
83 struct intel_bo *old_bo = writer->bo;
84 void *old_ptr = writer->ptr_opaque;
85
86 if (size >= writer->size &&
87 cmd_writer_alloc_and_map(cmd, writer, size) == XGL_SUCCESS) {
88 cmd_writer_copy(cmd, writer, (const uint32_t *) old_ptr, old_used);
89
90 intel_bo_unmap(old_bo);
91 intel_bo_unreference(old_bo);
92 } else {
93 intel_dev_log(cmd->dev, XGL_DBG_MSG_ERROR,
94 XGL_VALIDATION_LEVEL_0, XGL_NULL_HANDLE, 0, 0,
95 "failed to grow command buffer of size %u", writer->size);
96
97 /* wrap it and fail silently */
98 writer->used = 0;
99 cmd->result = XGL_ERROR_OUT_OF_GPU_MEMORY;
100 }
Chia-I Wu730e5362014-08-19 12:15:09 +0800101}
102
Chia-I Wue24c3292014-08-21 14:05:23 +0800103static void cmd_writer_unmap(struct intel_cmd *cmd,
104 struct intel_cmd_writer *writer)
Chia-I Wu730e5362014-08-19 12:15:09 +0800105{
Chia-I Wue24c3292014-08-21 14:05:23 +0800106 intel_bo_unmap(writer->bo);
107 writer->ptr_opaque = NULL;
108}
109
110static void cmd_writer_free(struct intel_cmd *cmd,
111 struct intel_cmd_writer *writer)
112{
113 intel_bo_unreference(writer->bo);
114 writer->bo = NULL;
115}
116
117static void cmd_writer_reset(struct intel_cmd *cmd,
118 struct intel_cmd_writer *writer)
119{
120 /* do not reset writer->size as we want to know how big it has grown to */
121 writer->used = 0;
122
123 if (writer->ptr_opaque)
124 cmd_writer_unmap(cmd, writer);
125 if (writer->bo)
126 cmd_writer_free(cmd, writer);
127}
128
129static void cmd_unmap(struct intel_cmd *cmd)
130{
131 cmd_writer_unmap(cmd, &cmd->batch);
Chia-I Wu24565ee2014-08-21 20:24:31 +0800132 cmd_writer_unmap(cmd, &cmd->state);
Chia-I Wu1cbc0052014-08-25 09:50:12 +0800133 cmd_writer_unmap(cmd, &cmd->kernel);
Chia-I Wu730e5362014-08-19 12:15:09 +0800134}
135
136static void cmd_reset(struct intel_cmd *cmd)
137{
Chia-I Wue24c3292014-08-21 14:05:23 +0800138 cmd_writer_reset(cmd, &cmd->batch);
Chia-I Wu24565ee2014-08-21 20:24:31 +0800139 cmd_writer_reset(cmd, &cmd->state);
Chia-I Wu1cbc0052014-08-25 09:50:12 +0800140 cmd_writer_reset(cmd, &cmd->kernel);
Chia-I Wu343b1372014-08-20 16:39:20 +0800141 cmd->reloc_used = 0;
Chia-I Wu04966702014-08-20 15:05:03 +0800142 cmd->result = XGL_SUCCESS;
Chia-I Wu730e5362014-08-19 12:15:09 +0800143}
144
/*
 * intel_obj destroy callback: recover the command buffer from its base
 * object and destroy it.
 */
static void cmd_destroy(struct intel_obj *obj)
{
    intel_cmd_destroy(intel_cmd_from_obj(obj));
}
151
152XGL_RESULT intel_cmd_create(struct intel_dev *dev,
153 const XGL_CMD_BUFFER_CREATE_INFO *info,
154 struct intel_cmd **cmd_ret)
155{
156 struct intel_cmd *cmd;
157
158 cmd = (struct intel_cmd *) intel_base_create(dev, sizeof(*cmd),
159 dev->base.dbg, XGL_DBG_OBJECT_CMD_BUFFER, info, 0);
160 if (!cmd)
161 return XGL_ERROR_OUT_OF_MEMORY;
162
163 cmd->obj.destroy = cmd_destroy;
164
165 cmd->dev = dev;
Chia-I Wue24c3292014-08-21 14:05:23 +0800166
Chia-I Wue0cdd832014-08-25 12:38:56 +0800167 /*
168 * XXX This is not quite right. intel_gpu sets maxMemRefsPerSubmission to
169 * batch_buffer_reloc_count, but we may emit up to two relocs, for start
170 * and end offsets, for each referenced memories.
171 */
Chia-I Wu343b1372014-08-20 16:39:20 +0800172 cmd->reloc_count = dev->gpu->batch_buffer_reloc_count;
173 cmd->relocs = icd_alloc(sizeof(cmd->relocs[0]) * cmd->reloc_count,
174 4096, XGL_SYSTEM_ALLOC_INTERNAL);
175 if (!cmd->relocs) {
176 intel_cmd_destroy(cmd);
177 return XGL_ERROR_OUT_OF_MEMORY;
178 }
Chia-I Wu730e5362014-08-19 12:15:09 +0800179
180 *cmd_ret = cmd;
181
182 return XGL_SUCCESS;
183}
184
185void intel_cmd_destroy(struct intel_cmd *cmd)
186{
187 cmd_reset(cmd);
Chia-I Wue24c3292014-08-21 14:05:23 +0800188
189 icd_free(cmd->relocs);
Chia-I Wu730e5362014-08-19 12:15:09 +0800190 intel_base_destroy(&cmd->obj.base);
191}
192
193XGL_RESULT intel_cmd_begin(struct intel_cmd *cmd, XGL_FLAGS flags)
194{
Chia-I Wu24565ee2014-08-21 20:24:31 +0800195 XGL_RESULT ret;
Chia-I Wu730e5362014-08-19 12:15:09 +0800196
197 cmd_reset(cmd);
198
Chia-I Wu24565ee2014-08-21 20:24:31 +0800199 if (cmd->flags != flags) {
Chia-I Wue24c3292014-08-21 14:05:23 +0800200 cmd->flags = flags;
Chia-I Wu24565ee2014-08-21 20:24:31 +0800201 cmd->batch.size = 0;
Chia-I Wu730e5362014-08-19 12:15:09 +0800202 }
203
Chia-I Wu24565ee2014-08-21 20:24:31 +0800204 if (!cmd->batch.size) {
Chia-I Wu1cbc0052014-08-25 09:50:12 +0800205 const XGL_UINT size =
206 cmd->dev->gpu->max_batch_buffer_size / sizeof(uint32_t) / 2;
207 XGL_UINT divider = 1;
Chia-I Wu24565ee2014-08-21 20:24:31 +0800208
209 if (flags & XGL_CMD_BUFFER_OPTIMIZE_GPU_SMALL_BATCH_BIT)
210 divider *= 4;
211
Chia-I Wu1cbc0052014-08-25 09:50:12 +0800212 cmd->batch.size = size / divider;
213 cmd->state.size = size / divider;
214 cmd->kernel.size = 16384 / sizeof(uint32_t) / divider;
Chia-I Wu24565ee2014-08-21 20:24:31 +0800215 }
216
217 ret = cmd_writer_alloc_and_map(cmd, &cmd->batch, cmd->batch.size);
Chia-I Wu1cbc0052014-08-25 09:50:12 +0800218 if (ret == XGL_SUCCESS)
219 ret = cmd_writer_alloc_and_map(cmd, &cmd->state, cmd->state.size);
220 if (ret == XGL_SUCCESS)
221 ret = cmd_writer_alloc_and_map(cmd, &cmd->kernel, cmd->kernel.size);
222 if (ret != XGL_SUCCESS) {
223 cmd_reset(cmd);
Chia-I Wu24565ee2014-08-21 20:24:31 +0800224 return ret;
225 }
226
Chia-I Wu79dfbb32014-08-25 12:19:02 +0800227 cmd_batch_begin(cmd);
228
Chia-I Wu24565ee2014-08-21 20:24:31 +0800229 return XGL_SUCCESS;
Chia-I Wu730e5362014-08-19 12:15:09 +0800230}
231
232XGL_RESULT intel_cmd_end(struct intel_cmd *cmd)
233{
234 struct intel_winsys *winsys = cmd->dev->winsys;
Chia-I Wu343b1372014-08-20 16:39:20 +0800235 XGL_UINT i;
Chia-I Wu730e5362014-08-19 12:15:09 +0800236
Chia-I Wue24c3292014-08-21 14:05:23 +0800237 cmd_batch_end(cmd);
Chia-I Wu730e5362014-08-19 12:15:09 +0800238
Chia-I Wu343b1372014-08-20 16:39:20 +0800239 /* TODO we need a more "explicit" winsys */
Chia-I Wufdfb8ed2014-08-21 15:40:07 +0800240 for (i = 0; i < cmd->reloc_used; i++) {
Chia-I Wu343b1372014-08-20 16:39:20 +0800241 const struct intel_cmd_reloc *reloc = &cmd->relocs[i];
242 uint64_t presumed_offset;
243 int err;
244
Chia-I Wue24c3292014-08-21 14:05:23 +0800245 err = intel_bo_add_reloc(reloc->writer->bo,
Chia-I Wu9ee38722014-08-25 12:11:36 +0800246 sizeof(uint32_t) * reloc->pos, reloc->bo, reloc->val,
Chia-I Wue24c3292014-08-21 14:05:23 +0800247 reloc->read_domains, reloc->write_domain, &presumed_offset);
Chia-I Wu343b1372014-08-20 16:39:20 +0800248 if (err) {
249 cmd->result = XGL_ERROR_UNKNOWN;
250 break;
251 }
252
253 assert(presumed_offset == (uint64_t) (uint32_t) presumed_offset);
Chia-I Wue24c3292014-08-21 14:05:23 +0800254 cmd_writer_patch(cmd, reloc->writer, reloc->pos,
255 (uint32_t) presumed_offset);
Chia-I Wu343b1372014-08-20 16:39:20 +0800256 }
257
Chia-I Wu730e5362014-08-19 12:15:09 +0800258 cmd_unmap(cmd);
259
Chia-I Wu04966702014-08-20 15:05:03 +0800260 if (cmd->result != XGL_SUCCESS)
261 return cmd->result;
Chia-I Wue24c3292014-08-21 14:05:23 +0800262
263 if (intel_winsys_can_submit_bo(winsys, &cmd->batch.bo, 1))
Chia-I Wu730e5362014-08-19 12:15:09 +0800264 return XGL_SUCCESS;
265 else
266 return XGL_ERROR_TOO_MANY_MEMORY_REFERENCES;
267}
268
Chia-I Wu09142132014-08-11 15:42:55 +0800269XGL_RESULT XGLAPI intelCreateCommandBuffer(
270 XGL_DEVICE device,
271 const XGL_CMD_BUFFER_CREATE_INFO* pCreateInfo,
272 XGL_CMD_BUFFER* pCmdBuffer)
273{
Chia-I Wu730e5362014-08-19 12:15:09 +0800274 struct intel_dev *dev = intel_dev(device);
275
276 return intel_cmd_create(dev, pCreateInfo,
277 (struct intel_cmd **) pCmdBuffer);
Chia-I Wu09142132014-08-11 15:42:55 +0800278}
279
280XGL_RESULT XGLAPI intelBeginCommandBuffer(
281 XGL_CMD_BUFFER cmdBuffer,
282 XGL_FLAGS flags)
283{
Chia-I Wu730e5362014-08-19 12:15:09 +0800284 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
285
286 return intel_cmd_begin(cmd, flags);
Chia-I Wu09142132014-08-11 15:42:55 +0800287}
288
289XGL_RESULT XGLAPI intelEndCommandBuffer(
290 XGL_CMD_BUFFER cmdBuffer)
291{
Chia-I Wu730e5362014-08-19 12:15:09 +0800292 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
293
294 return intel_cmd_end(cmd);
Chia-I Wu09142132014-08-11 15:42:55 +0800295}
296
297XGL_RESULT XGLAPI intelResetCommandBuffer(
298 XGL_CMD_BUFFER cmdBuffer)
299{
Chia-I Wu730e5362014-08-19 12:15:09 +0800300 struct intel_cmd *cmd = intel_cmd(cmdBuffer);
301
302 cmd_reset(cmd);
303
304 return XGL_SUCCESS;
Chia-I Wu09142132014-08-11 15:42:55 +0800305}
306
Chia-I Wu09142132014-08-11 15:42:55 +0800307XGL_VOID XGLAPI intelCmdPrepareMemoryRegions(
308 XGL_CMD_BUFFER cmdBuffer,
309 XGL_UINT transitionCount,
310 const XGL_MEMORY_STATE_TRANSITION* pStateTransitions)
311{
312}
313
314XGL_VOID XGLAPI intelCmdPrepareImages(
315 XGL_CMD_BUFFER cmdBuffer,
316 XGL_UINT transitionCount,
317 const XGL_IMAGE_STATE_TRANSITION* pStateTransitions)
318{
319}
320
Chia-I Wu09142132014-08-11 15:42:55 +0800321XGL_VOID XGLAPI intelCmdCopyMemory(
322 XGL_CMD_BUFFER cmdBuffer,
323 XGL_GPU_MEMORY srcMem,
324 XGL_GPU_MEMORY destMem,
325 XGL_UINT regionCount,
326 const XGL_MEMORY_COPY* pRegions)
327{
328}
329
330XGL_VOID XGLAPI intelCmdCopyImage(
331 XGL_CMD_BUFFER cmdBuffer,
332 XGL_IMAGE srcImage,
333 XGL_IMAGE destImage,
334 XGL_UINT regionCount,
335 const XGL_IMAGE_COPY* pRegions)
336{
337}
338
339XGL_VOID XGLAPI intelCmdCopyMemoryToImage(
340 XGL_CMD_BUFFER cmdBuffer,
341 XGL_GPU_MEMORY srcMem,
342 XGL_IMAGE destImage,
343 XGL_UINT regionCount,
344 const XGL_MEMORY_IMAGE_COPY* pRegions)
345{
346}
347
348XGL_VOID XGLAPI intelCmdCopyImageToMemory(
349 XGL_CMD_BUFFER cmdBuffer,
350 XGL_IMAGE srcImage,
351 XGL_GPU_MEMORY destMem,
352 XGL_UINT regionCount,
353 const XGL_MEMORY_IMAGE_COPY* pRegions)
354{
355}
356
357XGL_VOID XGLAPI intelCmdCloneImageData(
358 XGL_CMD_BUFFER cmdBuffer,
359 XGL_IMAGE srcImage,
360 XGL_IMAGE_STATE srcImageState,
361 XGL_IMAGE destImage,
362 XGL_IMAGE_STATE destImageState)
363{
364}
365
366XGL_VOID XGLAPI intelCmdUpdateMemory(
367 XGL_CMD_BUFFER cmdBuffer,
368 XGL_GPU_MEMORY destMem,
369 XGL_GPU_SIZE destOffset,
370 XGL_GPU_SIZE dataSize,
371 const XGL_UINT32* pData)
372{
373}
374
375XGL_VOID XGLAPI intelCmdFillMemory(
376 XGL_CMD_BUFFER cmdBuffer,
377 XGL_GPU_MEMORY destMem,
378 XGL_GPU_SIZE destOffset,
379 XGL_GPU_SIZE fillSize,
380 XGL_UINT32 data)
381{
382}
383
384XGL_VOID XGLAPI intelCmdClearColorImage(
385 XGL_CMD_BUFFER cmdBuffer,
386 XGL_IMAGE image,
387 const XGL_FLOAT color[4],
388 XGL_UINT rangeCount,
389 const XGL_IMAGE_SUBRESOURCE_RANGE* pRanges)
390{
391}
392
393XGL_VOID XGLAPI intelCmdClearColorImageRaw(
394 XGL_CMD_BUFFER cmdBuffer,
395 XGL_IMAGE image,
396 const XGL_UINT32 color[4],
397 XGL_UINT rangeCount,
398 const XGL_IMAGE_SUBRESOURCE_RANGE* pRanges)
399{
400}
401
402XGL_VOID XGLAPI intelCmdClearDepthStencil(
403 XGL_CMD_BUFFER cmdBuffer,
404 XGL_IMAGE image,
405 XGL_FLOAT depth,
406 XGL_UINT32 stencil,
407 XGL_UINT rangeCount,
408 const XGL_IMAGE_SUBRESOURCE_RANGE* pRanges)
409{
410}
411
412XGL_VOID XGLAPI intelCmdResolveImage(
413 XGL_CMD_BUFFER cmdBuffer,
414 XGL_IMAGE srcImage,
415 XGL_IMAGE destImage,
416 XGL_UINT rectCount,
417 const XGL_IMAGE_RESOLVE* pRects)
418{
419}
420
421XGL_VOID XGLAPI intelCmdSetEvent(
422 XGL_CMD_BUFFER cmdBuffer,
423 XGL_EVENT event)
424{
425}
426
427XGL_VOID XGLAPI intelCmdResetEvent(
428 XGL_CMD_BUFFER cmdBuffer,
429 XGL_EVENT event)
430{
431}
432
433XGL_VOID XGLAPI intelCmdMemoryAtomic(
434 XGL_CMD_BUFFER cmdBuffer,
435 XGL_GPU_MEMORY destMem,
436 XGL_GPU_SIZE destOffset,
437 XGL_UINT64 srcData,
438 XGL_ATOMIC_OP atomicOp)
439{
440}
441
442XGL_VOID XGLAPI intelCmdBeginQuery(
443 XGL_CMD_BUFFER cmdBuffer,
444 XGL_QUERY_POOL queryPool,
445 XGL_UINT slot,
446 XGL_FLAGS flags)
447{
448}
449
450XGL_VOID XGLAPI intelCmdEndQuery(
451 XGL_CMD_BUFFER cmdBuffer,
452 XGL_QUERY_POOL queryPool,
453 XGL_UINT slot)
454{
455}
456
457XGL_VOID XGLAPI intelCmdResetQueryPool(
458 XGL_CMD_BUFFER cmdBuffer,
459 XGL_QUERY_POOL queryPool,
460 XGL_UINT startQuery,
461 XGL_UINT queryCount)
462{
463}
464
465XGL_VOID XGLAPI intelCmdWriteTimestamp(
466 XGL_CMD_BUFFER cmdBuffer,
467 XGL_TIMESTAMP_TYPE timestampType,
468 XGL_GPU_MEMORY destMem,
469 XGL_GPU_SIZE destOffset)
470{
471}
472
473XGL_VOID XGLAPI intelCmdInitAtomicCounters(
474 XGL_CMD_BUFFER cmdBuffer,
475 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
476 XGL_UINT startCounter,
477 XGL_UINT counterCount,
478 const XGL_UINT32* pData)
479{
480}
481
482XGL_VOID XGLAPI intelCmdLoadAtomicCounters(
483 XGL_CMD_BUFFER cmdBuffer,
484 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
485 XGL_UINT startCounter,
486 XGL_UINT counterCount,
487 XGL_GPU_MEMORY srcMem,
488 XGL_GPU_SIZE srcOffset)
489{
490}
491
492XGL_VOID XGLAPI intelCmdSaveAtomicCounters(
493 XGL_CMD_BUFFER cmdBuffer,
494 XGL_PIPELINE_BIND_POINT pipelineBindPoint,
495 XGL_UINT startCounter,
496 XGL_UINT counterCount,
497 XGL_GPU_MEMORY destMem,
498 XGL_GPU_SIZE destOffset)
499{
500}
501
502XGL_VOID XGLAPI intelCmdDbgMarkerBegin(
503 XGL_CMD_BUFFER cmdBuffer,
504 const XGL_CHAR* pMarker)
505{
506}
507
508XGL_VOID XGLAPI intelCmdDbgMarkerEnd(
509 XGL_CMD_BUFFER cmdBuffer)
510{
511}