Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright 2015 Advanced Micro Devices, Inc. |
| 3 | * |
| 4 | * Permission is hereby granted, free of charge, to any person obtaining a |
| 5 | * copy of this software and associated documentation files (the "Software"), |
| 6 | * to deal in the Software without restriction, including without limitation |
| 7 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| 8 | * and/or sell copies of the Software, and to permit persons to whom the |
| 9 | * Software is furnished to do so, subject to the following conditions: |
| 10 | * |
| 11 | * The above copyright notice and this permission notice shall be included in |
| 12 | * all copies or substantial portions of the Software. |
| 13 | * |
| 14 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| 15 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| 16 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| 17 | * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR |
| 18 | * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, |
| 19 | * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR |
| 20 | * OTHER DEALINGS IN THE SOFTWARE. |
| 21 | * |
| 22 | * |
| 23 | */ |
| 24 | #include <linux/kthread.h> |
| 25 | #include <linux/wait.h> |
| 26 | #include <linux/sched.h> |
| 27 | #include <drm/drmP.h> |
| 28 | #include "gpu_scheduler.h" |
| 29 | |
Christian König | c24784f | 2016-10-28 17:04:07 +0200 | [diff] [blame] | 30 | static struct kmem_cache *sched_fence_slab; |
| 31 | |
| 32 | int amd_sched_fence_slab_init(void) |
| 33 | { |
| 34 | sched_fence_slab = kmem_cache_create( |
| 35 | "amd_sched_fence", sizeof(struct amd_sched_fence), 0, |
| 36 | SLAB_HWCACHE_ALIGN, NULL); |
| 37 | if (!sched_fence_slab) |
| 38 | return -ENOMEM; |
| 39 | |
| 40 | return 0; |
| 41 | } |
| 42 | |
| 43 | void amd_sched_fence_slab_fini(void) |
| 44 | { |
| 45 | rcu_barrier(); |
| 46 | kmem_cache_destroy(sched_fence_slab); |
| 47 | } |
| 48 | |
Christian König | 16a7133 | 2016-05-18 09:43:07 +0200 | [diff] [blame] | 49 | struct amd_sched_fence *amd_sched_fence_create(struct amd_sched_entity *entity, |
| 50 | void *owner) |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 51 | { |
| 52 | struct amd_sched_fence *fence = NULL; |
Christian König | ce882e6 | 2015-08-19 15:00:55 +0200 | [diff] [blame] | 53 | unsigned seq; |
| 54 | |
Chunming Zhou | f5617f9 | 2015-11-05 11:41:50 +0800 | [diff] [blame] | 55 | fence = kmem_cache_zalloc(sched_fence_slab, GFP_KERNEL); |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 56 | if (fence == NULL) |
| 57 | return NULL; |
Christian König | 393a0bd | 2015-11-05 12:57:10 +0100 | [diff] [blame] | 58 | |
Chunming Zhou | 84f76ea | 2015-08-24 12:47:36 +0800 | [diff] [blame] | 59 | fence->owner = owner; |
Christian König | 16a7133 | 2016-05-18 09:43:07 +0200 | [diff] [blame] | 60 | fence->sched = entity->sched; |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 61 | spin_lock_init(&fence->lock); |
Christian König | ce882e6 | 2015-08-19 15:00:55 +0200 | [diff] [blame] | 62 | |
Christian König | 16a7133 | 2016-05-18 09:43:07 +0200 | [diff] [blame] | 63 | seq = atomic_inc_return(&entity->fence_seq); |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 64 | dma_fence_init(&fence->scheduled, &amd_sched_fence_ops_scheduled, |
| 65 | &fence->lock, entity->fence_context, seq); |
| 66 | dma_fence_init(&fence->finished, &amd_sched_fence_ops_finished, |
| 67 | &fence->lock, entity->fence_context + 1, seq); |
Christian König | ce882e6 | 2015-08-19 15:00:55 +0200 | [diff] [blame] | 68 | |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 69 | return fence; |
| 70 | } |
| 71 | |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 72 | void amd_sched_fence_scheduled(struct amd_sched_fence *fence) |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 73 | { |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 74 | int ret = dma_fence_signal(&fence->scheduled); |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 75 | |
Christian König | 2983e5c | 2015-08-10 14:20:55 +0200 | [diff] [blame] | 76 | if (!ret) |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 77 | DMA_FENCE_TRACE(&fence->scheduled, |
| 78 | "signaled from irq context\n"); |
Christian König | 2983e5c | 2015-08-10 14:20:55 +0200 | [diff] [blame] | 79 | else |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 80 | DMA_FENCE_TRACE(&fence->scheduled, |
| 81 | "was already signaled\n"); |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 82 | } |
| 83 | |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 84 | void amd_sched_fence_finished(struct amd_sched_fence *fence) |
Christian König | 393a0bd | 2015-11-05 12:57:10 +0100 | [diff] [blame] | 85 | { |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 86 | int ret = dma_fence_signal(&fence->finished); |
Christian König | 393a0bd | 2015-11-05 12:57:10 +0100 | [diff] [blame] | 87 | |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 88 | if (!ret) |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 89 | DMA_FENCE_TRACE(&fence->finished, |
| 90 | "signaled from irq context\n"); |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 91 | else |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 92 | DMA_FENCE_TRACE(&fence->finished, |
| 93 | "was already signaled\n"); |
Christian König | 393a0bd | 2015-11-05 12:57:10 +0100 | [diff] [blame] | 94 | } |
| 95 | |
/*
 * .get_driver_name callback shared by both fence ops tables.
 * The fence argument is not inspected; the name is a constant.
 */
static const char *amd_sched_fence_get_driver_name(struct dma_fence *fence)
{
	static const char driver_name[] = "amd_sched";

	return driver_name;
}
| 100 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 101 | static const char *amd_sched_fence_get_timeline_name(struct dma_fence *f) |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 102 | { |
| 103 | struct amd_sched_fence *fence = to_amd_sched_fence(f); |
Christian König | 9b398fa | 2015-09-07 18:16:49 +0200 | [diff] [blame] | 104 | return (const char *)fence->sched->name; |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 105 | } |
| 106 | |
/*
 * .enable_signaling callback shared by both fence ops tables.
 * Nothing needs to be set up here, so it unconditionally returns true.
 */
static bool amd_sched_fence_enable_signaling(struct dma_fence *f)
{
	return true;
}
| 111 | |
Christian König | 189e0fb | 2016-03-15 13:58:14 +0100 | [diff] [blame] | 112 | /** |
| 113 | * amd_sched_fence_free - free up the fence memory |
| 114 | * |
| 115 | * @rcu: RCU callback head |
| 116 | * |
| 117 | * Free up the fence memory after the RCU grace period. |
| 118 | */ |
| 119 | static void amd_sched_fence_free(struct rcu_head *rcu) |
Chunming Zhou | f5617f9 | 2015-11-05 11:41:50 +0800 | [diff] [blame] | 120 | { |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 121 | struct dma_fence *f = container_of(rcu, struct dma_fence, rcu); |
Chunming Zhou | f5617f9 | 2015-11-05 11:41:50 +0800 | [diff] [blame] | 122 | struct amd_sched_fence *fence = to_amd_sched_fence(f); |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 123 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 124 | dma_fence_put(fence->parent); |
Chunming Zhou | f5617f9 | 2015-11-05 11:41:50 +0800 | [diff] [blame] | 125 | kmem_cache_free(sched_fence_slab, fence); |
| 126 | } |
| 127 | |
Christian König | 189e0fb | 2016-03-15 13:58:14 +0100 | [diff] [blame] | 128 | /** |
Grazvydas Ignotas | 9566213 | 2016-10-23 21:31:47 +0300 | [diff] [blame] | 129 | * amd_sched_fence_release_scheduled - callback that fence can be freed |
Christian König | 189e0fb | 2016-03-15 13:58:14 +0100 | [diff] [blame] | 130 | * |
| 131 | * @fence: fence |
| 132 | * |
| 133 | * This function is called when the reference count becomes zero. |
| 134 | * It just RCU schedules freeing up the fence. |
| 135 | */ |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 136 | static void amd_sched_fence_release_scheduled(struct dma_fence *f) |
Christian König | 189e0fb | 2016-03-15 13:58:14 +0100 | [diff] [blame] | 137 | { |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 138 | struct amd_sched_fence *fence = to_amd_sched_fence(f); |
| 139 | |
| 140 | call_rcu(&fence->finished.rcu, amd_sched_fence_free); |
Christian König | 189e0fb | 2016-03-15 13:58:14 +0100 | [diff] [blame] | 141 | } |
| 142 | |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 143 | /** |
Grazvydas Ignotas | 9566213 | 2016-10-23 21:31:47 +0300 | [diff] [blame] | 144 | * amd_sched_fence_release_finished - drop extra reference |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 145 | * |
| 146 | * @f: fence |
| 147 | * |
| 148 | * Drop the extra reference from the scheduled fence to the base fence. |
| 149 | */ |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 150 | static void amd_sched_fence_release_finished(struct dma_fence *f) |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 151 | { |
| 152 | struct amd_sched_fence *fence = to_amd_sched_fence(f); |
| 153 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 154 | dma_fence_put(&fence->scheduled); |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 155 | } |
| 156 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 157 | const struct dma_fence_ops amd_sched_fence_ops_scheduled = { |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 158 | .get_driver_name = amd_sched_fence_get_driver_name, |
| 159 | .get_timeline_name = amd_sched_fence_get_timeline_name, |
| 160 | .enable_signaling = amd_sched_fence_enable_signaling, |
Christian König | 2983e5c | 2015-08-10 14:20:55 +0200 | [diff] [blame] | 161 | .signaled = NULL, |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 162 | .wait = dma_fence_default_wait, |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 163 | .release = amd_sched_fence_release_scheduled, |
| 164 | }; |
| 165 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 166 | const struct dma_fence_ops amd_sched_fence_ops_finished = { |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 167 | .get_driver_name = amd_sched_fence_get_driver_name, |
| 168 | .get_timeline_name = amd_sched_fence_get_timeline_name, |
| 169 | .enable_signaling = amd_sched_fence_enable_signaling, |
| 170 | .signaled = NULL, |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 171 | .wait = dma_fence_default_wait, |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 172 | .release = amd_sched_fence_release_finished, |
Chunming Zhou | f556cb0c | 2015-08-02 11:18:04 +0800 | [diff] [blame] | 173 | }; |