icd/intel/queue.c - platform/external/vulkan-validation-layers - Gitiles

 /*
  * XGL
  *
  * Copyright (C) 2014 LunarG, Inc.
  *
  * Permission is hereby granted, free of charge, to any person obtaining a
  * copy of this software and associated documentation files (the "Software"),
  * to deal in the Software without restriction, including without limitation
  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  * and/or sell copies of the Software, and to permit persons to whom the
  * Software is furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included
  * in all copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  * DEALINGS IN THE SOFTWARE.
  *
  * Authors:
  *   Chia-I Wu <olv@lunarg.com>
  */

 #include "genhw/genhw.h"
 #include "kmd/winsys.h"
 #include "cmd.h"
 #include "dev.h"
 #include "fence.h"
 #include "queue.h"

 static XGL_RESULT queue_submit_bo(struct intel_queue *queue,
                                   struct intel_bo *bo,
                                   XGL_GPU_SIZE used)
 {
     struct intel_winsys *winsys = queue->dev->winsys;
     int err;

     if (intel_debug & INTEL_DEBUG_NOHW)
         err = 0;
     else
         err = intel_winsys_submit_bo(winsys, queue->ring, bo, used, 0);

     return (err) ? XGL_ERROR_UNKNOWN : XGL_SUCCESS;
 }

 static struct intel_bo *queue_create_bo(struct intel_queue *queue,
                                         XGL_GPU_SIZE size,
                                         const void *cmd,
                                         XGL_SIZE cmd_len)
 {
     struct intel_bo *bo;
     void *ptr;

     bo = intel_winsys_alloc_buffer(queue->dev->winsys,
             "queue bo", size, true);
     if (!bo)
         return NULL;

     if (!cmd_len)
         return bo;

     ptr = intel_bo_map(bo, true);
     if (!ptr) {
         intel_bo_unreference(bo);
         return NULL;
     }

     memcpy(ptr, cmd, cmd_len);
     intel_bo_unmap(bo);

     return bo;
 }

 static XGL_RESULT queue_select_pipeline(struct intel_queue *queue,
                                         int pipeline_select)
 {
     uint32_t pipeline_select_cmd[] = {
         GEN6_RENDER_CMD(SINGLE_DW, PIPELINE_SELECT),
         GEN6_MI_CMD(MI_BATCH_BUFFER_END),
     };
     struct intel_bo *bo;
     XGL_RESULT ret;

     if (queue->ring != INTEL_RING_RENDER ||
         queue->last_pipeline_select == pipeline_select)
         return XGL_SUCCESS;

     switch (pipeline_select) {
     case GEN6_PIPELINE_SELECT_DW0_SELECT_3D:
         bo = queue->select_graphics_bo;
         break;
     case GEN6_PIPELINE_SELECT_DW0_SELECT_MEDIA:
         bo = queue->select_compute_bo;
         break;
     default:
         return XGL_ERROR_INVALID_VALUE;
         break;
     }

     if (!bo) {
         pipeline_select_cmd[0] |= pipeline_select;
         bo = queue_create_bo(queue, sizeof(pipeline_select_cmd),
                 pipeline_select_cmd, sizeof(pipeline_select_cmd));
         if (!bo)
             return XGL_ERROR_OUT_OF_GPU_MEMORY;

         switch (pipeline_select) {
         case GEN6_PIPELINE_SELECT_DW0_SELECT_3D:
             queue->select_graphics_bo = bo;
             break;
         case GEN6_PIPELINE_SELECT_DW0_SELECT_MEDIA:
             queue->select_compute_bo = bo;
             break;
         default:
             break;
         }
     }

     ret = queue_submit_bo(queue, bo, sizeof(pipeline_select_cmd));
     if (ret == XGL_SUCCESS)
         queue->last_pipeline_select = pipeline_select;

     return ret;
 }

 static XGL_RESULT queue_init_hw_and_atomic_bo(struct intel_queue *queue)
 {
     const uint32_t ctx_init_cmd[] = {
         /* STATE_SIP */
         GEN6_RENDER_CMD(COMMON, STATE_SIP),
         0,
         /* PIPELINE_SELECT */
         GEN6_RENDER_CMD(SINGLE_DW, PIPELINE_SELECT) |
             GEN6_PIPELINE_SELECT_DW0_SELECT_3D,
         /* 3DSTATE_VF_STATISTICS */
         GEN6_RENDER_CMD(SINGLE_DW, 3DSTATE_VF_STATISTICS),
         /* end */
         GEN6_MI_CMD(MI_BATCH_BUFFER_END),
         GEN6_MI_CMD(MI_NOOP),
     };
     struct intel_bo *bo;
     XGL_RESULT ret;

     if (queue->ring != INTEL_RING_RENDER) {
         queue->last_pipeline_select = -1;
         queue->atomic_bo = queue_create_bo(queue,
                 sizeof(uint32_t) * INTEL_QUEUE_ATOMIC_COUNTER_COUNT,
                 NULL, 0);
         return (queue->atomic_bo) ? XGL_SUCCESS : XGL_ERROR_OUT_OF_GPU_MEMORY;
     }

     bo = queue_create_bo(queue,
             sizeof(uint32_t) * INTEL_QUEUE_ATOMIC_COUNTER_COUNT,
             ctx_init_cmd, sizeof(ctx_init_cmd));
     if (!bo)
         return XGL_ERROR_OUT_OF_GPU_MEMORY;

     ret = queue_submit_bo(queue, bo, sizeof(ctx_init_cmd));
     if (ret != XGL_SUCCESS) {
         intel_bo_unreference(bo);
         return ret;
     }

     queue->last_pipeline_select = GEN6_PIPELINE_SELECT_DW0_SELECT_3D;
     /* reuse */
     queue->atomic_bo = bo;

     return XGL_SUCCESS;
 }

 XGL_RESULT intel_queue_create(struct intel_dev *dev,
                               enum intel_gpu_engine_type engine,
                               struct intel_queue **queue_ret)
 {
     struct intel_queue *queue;
     enum intel_ring_type ring;

     switch (engine) {
     case INTEL_GPU_ENGINE_3D:
         ring = INTEL_RING_RENDER;
         break;
     default:
         return XGL_ERROR_INVALID_VALUE;
         break;
     }

     queue = (struct intel_queue *) intel_base_create(dev, sizeof(*queue),
             dev->base.dbg, XGL_DBG_OBJECT_QUEUE, NULL, 0);
     if (!queue)
         return XGL_ERROR_OUT_OF_MEMORY;

     queue->dev = dev;
     queue->ring = ring;

     if (queue_init_hw_and_atomic_bo(queue) != XGL_SUCCESS) {
         intel_queue_destroy(queue);
         return XGL_ERROR_INITIALIZATION_FAILED;
     }

     *queue_ret = queue;

     return XGL_SUCCESS;
 }

 void intel_queue_destroy(struct intel_queue *queue)
 {
     if (queue->atomic_bo)
         intel_bo_unreference(queue->atomic_bo);
     if (queue->select_graphics_bo)
         intel_bo_unreference(queue->select_graphics_bo);
     if (queue->select_compute_bo)
         intel_bo_unreference(queue->select_compute_bo);
     intel_base_destroy(&queue->base);
 }

 XGL_RESULT intel_queue_wait(struct intel_queue *queue, int64_t timeout)
 {
     struct intel_bo *bo = (queue->last_submitted_cmd) ?
         intel_cmd_get_batch(queue->last_submitted_cmd, NULL) : NULL;

     return (!bo || intel_bo_wait(bo, timeout) == 0) ?
         XGL_SUCCESS : XGL_ERROR_UNKNOWN;
 }

 XGL_RESULT XGLAPI intelQueueSetGlobalMemReferences(
     XGL_QUEUE                                   queue,
     XGL_UINT                                    memRefCount,
     const XGL_MEMORY_REF*                       pMemRefs)
 {
     /*
      * The winwys maintains the list of memory references.  These are ignored
      * until we move away from the winsys.
      */
     return XGL_SUCCESS;
 }

 XGL_RESULT XGLAPI intelQueueWaitIdle(
     XGL_QUEUE                                   queue_)
 {
     struct intel_queue *queue = intel_queue(queue_);

     return intel_queue_wait(queue, -1);
 }

 XGL_RESULT XGLAPI intelQueueSubmit(
     XGL_QUEUE                                   queue_,
     XGL_UINT                                    cmdBufferCount,
     const XGL_CMD_BUFFER*                       pCmdBuffers,
     XGL_UINT                                    memRefCount,
     const XGL_MEMORY_REF*                       pMemRefs,
     XGL_FENCE                                   fence_)
 {
     struct intel_queue *queue = intel_queue(queue_);
     XGL_RESULT ret = XGL_SUCCESS;
     XGL_UINT i;

     for (i = 0; i < cmdBufferCount; i++) {
         struct intel_cmd *cmd = intel_cmd(pCmdBuffers[i]);
         struct intel_bo *bo;
         XGL_GPU_SIZE used;
         XGL_RESULT ret;

         ret = queue_select_pipeline(queue, cmd->pipeline_select);
         if (ret != XGL_SUCCESS)
             break;

         bo = intel_cmd_get_batch(cmd, &used);
         ret = queue_submit_bo(queue, bo, used);
         queue->last_submitted_cmd = cmd;

         if (intel_debug & INTEL_DEBUG_BATCH)
             intel_cmd_decode(cmd);

         if (ret != XGL_SUCCESS)
             break;
     }

     if (ret == XGL_SUCCESS && fence_ != XGL_NULL_HANDLE) {
         struct intel_fence *fence = intel_fence(fence_);
         intel_fence_set_cmd(fence, queue->last_submitted_cmd);
     }

     /* XGL_MEMORY_REFs are ignored as the winsys already knows them */

     return ret;
 }

 XGL_RESULT XGLAPI intelOpenSharedQueueSemaphore(
     XGL_DEVICE                                  device,
     const XGL_QUEUE_SEMAPHORE_OPEN_INFO*        pOpenInfo,
     XGL_QUEUE_SEMAPHORE*                        pSemaphore)
 {
     return XGL_ERROR_UNAVAILABLE;
 }

 XGL_RESULT XGLAPI intelCreateQueueSemaphore(
     XGL_DEVICE                                  device,
     const XGL_QUEUE_SEMAPHORE_CREATE_INFO*      pCreateInfo,
     XGL_QUEUE_SEMAPHORE*                        pSemaphore)
 {
     /*
      * We want to find an unused semaphore register and initialize it.  Signal
      * will increment the register.  Wait will atomically decrement it and
      * block if the value is zero, or a large constant N if we do not want to
      * go negative.
      *
      * XXX However, MI_SEMAPHORE_MBOX does not seem to have the flexibility.
      */
     return XGL_ERROR_UNAVAILABLE;
 }

 XGL_RESULT XGLAPI intelSignalQueueSemaphore(
     XGL_QUEUE                                   queue,
     XGL_QUEUE_SEMAPHORE                         semaphore)
 {
     return XGL_ERROR_UNAVAILABLE;
 }

 XGL_RESULT XGLAPI intelWaitQueueSemaphore(
     XGL_QUEUE                                   queue,
     XGL_QUEUE_SEMAPHORE                         semaphore)
 {
     return XGL_ERROR_UNAVAILABLE;
 }
	/*
	* XGL
	*
	* Copyright (C) 2014 LunarG, Inc.
	*
	* Permission is hereby granted, free of charge, to any person obtaining a
	* copy of this software and associated documentation files (the "Software"),
	* to deal in the Software without restriction, including without limitation
	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
	* and/or sell copies of the Software, and to permit persons to whom the
	* Software is furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included
	* in all copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
	* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
	* DEALINGS IN THE SOFTWARE.
	*
	* Authors:
	* Chia-I Wu <olv@lunarg.com>
	*/

	#include "genhw/genhw.h"
	#include "kmd/winsys.h"
	#include "cmd.h"
	#include "dev.h"
	#include "fence.h"
	#include "queue.h"

	static XGL_RESULT queue_submit_bo(struct intel_queue *queue,
	struct intel_bo *bo,
	XGL_GPU_SIZE used)
	{
	struct intel_winsys *winsys = queue->dev->winsys;
	int err;

	if (intel_debug & INTEL_DEBUG_NOHW)
	err = 0;
	else
	err = intel_winsys_submit_bo(winsys, queue->ring, bo, used, 0);

	return (err) ? XGL_ERROR_UNKNOWN : XGL_SUCCESS;
	}

	static struct intel_bo queue_create_bo(struct intel_queue queue,
	XGL_GPU_SIZE size,
	const void *cmd,
	XGL_SIZE cmd_len)
	{
	struct intel_bo *bo;
	void *ptr;

	bo = intel_winsys_alloc_buffer(queue->dev->winsys,
	"queue bo", size, true);
	if (!bo)
	return NULL;

	if (!cmd_len)
	return bo;

	ptr = intel_bo_map(bo, true);
	if (!ptr) {
	intel_bo_unreference(bo);
	return NULL;
	}

	memcpy(ptr, cmd, cmd_len);
	intel_bo_unmap(bo);

	return bo;
	}

	static XGL_RESULT queue_select_pipeline(struct intel_queue *queue,
	int pipeline_select)
	{
	uint32_t pipeline_select_cmd[] = {
	GEN6_RENDER_CMD(SINGLE_DW, PIPELINE_SELECT),
	GEN6_MI_CMD(MI_BATCH_BUFFER_END),
	};
	struct intel_bo *bo;
	XGL_RESULT ret;

	if (queue->ring != INTEL_RING_RENDER \|\|
	queue->last_pipeline_select == pipeline_select)
	return XGL_SUCCESS;

	switch (pipeline_select) {
	case GEN6_PIPELINE_SELECT_DW0_SELECT_3D:
	bo = queue->select_graphics_bo;
	break;
	case GEN6_PIPELINE_SELECT_DW0_SELECT_MEDIA:
	bo = queue->select_compute_bo;
	break;
	default:
	return XGL_ERROR_INVALID_VALUE;
	break;
	}

	if (!bo) {
	pipeline_select_cmd[0] \|= pipeline_select;
	bo = queue_create_bo(queue, sizeof(pipeline_select_cmd),
	pipeline_select_cmd, sizeof(pipeline_select_cmd));
	if (!bo)
	return XGL_ERROR_OUT_OF_GPU_MEMORY;

	switch (pipeline_select) {
	case GEN6_PIPELINE_SELECT_DW0_SELECT_3D:
	queue->select_graphics_bo = bo;
	break;
	case GEN6_PIPELINE_SELECT_DW0_SELECT_MEDIA:
	queue->select_compute_bo = bo;
	break;
	default:
	break;
	}
	}

	ret = queue_submit_bo(queue, bo, sizeof(pipeline_select_cmd));
	if (ret == XGL_SUCCESS)
	queue->last_pipeline_select = pipeline_select;

	return ret;
	}

	static XGL_RESULT queue_init_hw_and_atomic_bo(struct intel_queue *queue)
	{
	const uint32_t ctx_init_cmd[] = {
	/* STATE_SIP */
	GEN6_RENDER_CMD(COMMON, STATE_SIP),
	0,
	/* PIPELINE_SELECT */
	GEN6_RENDER_CMD(SINGLE_DW, PIPELINE_SELECT) \|
	GEN6_PIPELINE_SELECT_DW0_SELECT_3D,
	/* 3DSTATE_VF_STATISTICS */
	GEN6_RENDER_CMD(SINGLE_DW, 3DSTATE_VF_STATISTICS),
	/* end */
	GEN6_MI_CMD(MI_BATCH_BUFFER_END),
	GEN6_MI_CMD(MI_NOOP),
	};
	struct intel_bo *bo;
	XGL_RESULT ret;

	if (queue->ring != INTEL_RING_RENDER) {
	queue->last_pipeline_select = -1;
	queue->atomic_bo = queue_create_bo(queue,
	sizeof(uint32_t) * INTEL_QUEUE_ATOMIC_COUNTER_COUNT,
	NULL, 0);
	return (queue->atomic_bo) ? XGL_SUCCESS : XGL_ERROR_OUT_OF_GPU_MEMORY;
	}

	bo = queue_create_bo(queue,
	sizeof(uint32_t) * INTEL_QUEUE_ATOMIC_COUNTER_COUNT,
	ctx_init_cmd, sizeof(ctx_init_cmd));
	if (!bo)
	return XGL_ERROR_OUT_OF_GPU_MEMORY;

	ret = queue_submit_bo(queue, bo, sizeof(ctx_init_cmd));
	if (ret != XGL_SUCCESS) {
	intel_bo_unreference(bo);
	return ret;
	}

	queue->last_pipeline_select = GEN6_PIPELINE_SELECT_DW0_SELECT_3D;
	/* reuse */
	queue->atomic_bo = bo;

	return XGL_SUCCESS;
	}

	XGL_RESULT intel_queue_create(struct intel_dev *dev,
	enum intel_gpu_engine_type engine,
	struct intel_queue **queue_ret)
	{
	struct intel_queue *queue;
	enum intel_ring_type ring;

	switch (engine) {
	case INTEL_GPU_ENGINE_3D:
	ring = INTEL_RING_RENDER;
	break;
	default:
	return XGL_ERROR_INVALID_VALUE;
	break;
	}

	queue = (struct intel_queue ) intel_base_create(dev, sizeof(queue),
	dev->base.dbg, XGL_DBG_OBJECT_QUEUE, NULL, 0);
	if (!queue)
	return XGL_ERROR_OUT_OF_MEMORY;

	queue->dev = dev;
	queue->ring = ring;

	if (queue_init_hw_and_atomic_bo(queue) != XGL_SUCCESS) {
	intel_queue_destroy(queue);
	return XGL_ERROR_INITIALIZATION_FAILED;
	}

	*queue_ret = queue;

	return XGL_SUCCESS;
	}

	void intel_queue_destroy(struct intel_queue *queue)
	{
	if (queue->atomic_bo)
	intel_bo_unreference(queue->atomic_bo);
	if (queue->select_graphics_bo)
	intel_bo_unreference(queue->select_graphics_bo);
	if (queue->select_compute_bo)
	intel_bo_unreference(queue->select_compute_bo);
	intel_base_destroy(&queue->base);
	}

	XGL_RESULT intel_queue_wait(struct intel_queue *queue, int64_t timeout)
	{
	struct intel_bo *bo = (queue->last_submitted_cmd) ?
	intel_cmd_get_batch(queue->last_submitted_cmd, NULL) : NULL;

	return (!bo \|\| intel_bo_wait(bo, timeout) == 0) ?
	XGL_SUCCESS : XGL_ERROR_UNKNOWN;
	}

	XGL_RESULT XGLAPI intelQueueSetGlobalMemReferences(
	XGL_QUEUE queue,
	XGL_UINT memRefCount,
	const XGL_MEMORY_REF* pMemRefs)
	{
	/*
	* The winwys maintains the list of memory references. These are ignored
	* until we move away from the winsys.
	*/
	return XGL_SUCCESS;
	}

	XGL_RESULT XGLAPI intelQueueWaitIdle(
	XGL_QUEUE queue_)
	{
	struct intel_queue *queue = intel_queue(queue_);

	return intel_queue_wait(queue, -1);
	}

	XGL_RESULT XGLAPI intelQueueSubmit(
	XGL_QUEUE queue_,
	XGL_UINT cmdBufferCount,
	const XGL_CMD_BUFFER* pCmdBuffers,
	XGL_UINT memRefCount,
	const XGL_MEMORY_REF* pMemRefs,
	XGL_FENCE fence_)
	{
	struct intel_queue *queue = intel_queue(queue_);
	XGL_RESULT ret = XGL_SUCCESS;
	XGL_UINT i;

	for (i = 0; i < cmdBufferCount; i++) {
	struct intel_cmd *cmd = intel_cmd(pCmdBuffers[i]);
	struct intel_bo *bo;
	XGL_GPU_SIZE used;
	XGL_RESULT ret;

	ret = queue_select_pipeline(queue, cmd->pipeline_select);
	if (ret != XGL_SUCCESS)
	break;

	bo = intel_cmd_get_batch(cmd, &used);
	ret = queue_submit_bo(queue, bo, used);
	queue->last_submitted_cmd = cmd;

	if (intel_debug & INTEL_DEBUG_BATCH)
	intel_cmd_decode(cmd);

	if (ret != XGL_SUCCESS)
	break;
	}

	if (ret == XGL_SUCCESS && fence_ != XGL_NULL_HANDLE) {
	struct intel_fence *fence = intel_fence(fence_);
	intel_fence_set_cmd(fence, queue->last_submitted_cmd);
	}

	/* XGL_MEMORY_REFs are ignored as the winsys already knows them */

	return ret;
	}

	XGL_RESULT XGLAPI intelOpenSharedQueueSemaphore(
	XGL_DEVICE device,
	const XGL_QUEUE_SEMAPHORE_OPEN_INFO* pOpenInfo,
	XGL_QUEUE_SEMAPHORE* pSemaphore)
	{
	return XGL_ERROR_UNAVAILABLE;
	}

	XGL_RESULT XGLAPI intelCreateQueueSemaphore(
	XGL_DEVICE device,
	const XGL_QUEUE_SEMAPHORE_CREATE_INFO* pCreateInfo,
	XGL_QUEUE_SEMAPHORE* pSemaphore)
	{
	/*
	* We want to find an unused semaphore register and initialize it. Signal
	* will increment the register. Wait will atomically decrement it and
	* block if the value is zero, or a large constant N if we do not want to
	* go negative.
	*
	* XXX However, MI_SEMAPHORE_MBOX does not seem to have the flexibility.
	*/
	return XGL_ERROR_UNAVAILABLE;
	}

	XGL_RESULT XGLAPI intelSignalQueueSemaphore(
	XGL_QUEUE queue,
	XGL_QUEUE_SEMAPHORE semaphore)
	{
	return XGL_ERROR_UNAVAILABLE;
	}

	XGL_RESULT XGLAPI intelWaitQueueSemaphore(
	XGL_QUEUE queue,
	XGL_QUEUE_SEMAPHORE semaphore)
	{
	return XGL_ERROR_UNAVAILABLE;
	}