/* Copyright (c) 2016-2017 The Linux Foundation. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 and
 * only version 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 */

#include <linux/types.h>
#include <linux/cpumask.h>
#include <linux/qcom_scm.h>
#include <linux/dma-mapping.h>
#include <linux/of_address.h>
#include <linux/soc/qcom/mdt_loader.h>
#include "msm_gem.h"
#include "msm_mmu.h"
#include "a5xx_gpu.h"

extern bool hang_debug;
static void a5xx_dump(struct msm_gpu *gpu);

#define GPU_PAS_ID 13

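/*
 * Load the zap shader firmware (MDT format) into the reserved memory region
 * described by the zap-shader/memory-region device tree nodes and ask the
 * secure world to authenticate and bring it up.
 */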
static int zap_shader_load_mdt(struct device *dev, const char *fwname)
{
	const struct firmware *fw;
	struct device_node *np;
	struct resource r;
	phys_addr_t mem_phys;
	ssize_t mem_size;
	void *mem_region = NULL;
	int ret;

	if (!IS_ENABLED(CONFIG_ARCH_QCOM))
		return -EINVAL;

	np = of_get_child_by_name(dev->of_node, "zap-shader");
	if (!np)
		return -ENODEV;

	np = of_parse_phandle(np, "memory-region", 0);
	if (!np)
		return -EINVAL;

	ret = of_address_to_resource(np, 0, &r);
	if (ret)
		return ret;

	mem_phys = r.start;
	mem_size = resource_size(&r);

	/* Request the MDT file for the firmware */
	ret = request_firmware(&fw, fwname, dev);
	if (ret) {
		DRM_DEV_ERROR(dev, "Unable to load %s\n", fwname);
		return ret;
	}

	/* Figure out how much memory we need */
	mem_size = qcom_mdt_get_size(fw);
	if (mem_size < 0) {
		ret = mem_size;
		goto out;
	}

	/* Allocate memory for the firmware image */
	mem_region = memremap(mem_phys, mem_size, MEMREMAP_WC);
	if (!mem_region) {
		ret = -ENOMEM;
		goto out;
	}

	/* Load the rest of the MDT */
	ret = qcom_mdt_load(dev, fw, fwname, GPU_PAS_ID, mem_region, mem_phys,
		mem_size);
	if (ret)
		goto out;

	/* Send the image to the secure world */
	ret = qcom_scm_pas_auth_and_reset(GPU_PAS_ID);
	if (ret)
		DRM_DEV_ERROR(dev, "Unable to authorize the image\n");

out:
	if (mem_region)
		memunmap(mem_region);

	release_firmware(fw);

	return ret;
}

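/*
 * Write the IBs for a submit into the ringbuffer, then emit a CACHE_FLUSH_TS
 * event to write the fence seqno to memory; the resulting interrupt drives
 * retire processing in a5xx_irq().
 */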
static void a5xx_submit(struct msm_gpu *gpu, struct msm_gem_submit *submit,
	struct msm_file_private *ctx)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	struct msm_drm_private *priv = gpu->dev->dev_private;
	struct msm_ringbuffer *ring = gpu->rb;
	unsigned int i, ibs = 0;

	for (i = 0; i < submit->nr_cmds; i++) {
		switch (submit->cmd[i].type) {
		case MSM_SUBMIT_CMD_IB_TARGET_BUF:
			break;
		case MSM_SUBMIT_CMD_CTX_RESTORE_BUF:
			if (priv->lastctx == ctx)
				break;
		case MSM_SUBMIT_CMD_BUF:
			OUT_PKT7(ring, CP_INDIRECT_BUFFER_PFE, 3);
			OUT_RING(ring, lower_32_bits(submit->cmd[i].iova));
			OUT_RING(ring, upper_32_bits(submit->cmd[i].iova));
			OUT_RING(ring, submit->cmd[i].size);
			ibs++;
			break;
		}
	}

	OUT_PKT4(ring, REG_A5XX_CP_SCRATCH_REG(2), 1);
	OUT_RING(ring, submit->fence->seqno);

	OUT_PKT7(ring, CP_EVENT_WRITE, 4);
	OUT_RING(ring, CACHE_FLUSH_TS | (1 << 31));
	OUT_RING(ring, lower_32_bits(rbmemptr(adreno_gpu, fence)));
	OUT_RING(ring, upper_32_bits(rbmemptr(adreno_gpu, fence)));
	OUT_RING(ring, submit->fence->seqno);

	gpu->funcs->flush(gpu);
}

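/* Register/value pairs used by a5xx_set_hwcg() to program hardware clock gating */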
static const struct {
	u32 offset;
	u32 value;
} a5xx_hwcg[] = {
	{REG_A5XX_RBBM_CLOCK_CNTL_SP0, 0x02222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_SP1, 0x02222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_SP2, 0x02222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_SP3, 0x02222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_SP0, 0x02222220},
	{REG_A5XX_RBBM_CLOCK_CNTL2_SP1, 0x02222220},
	{REG_A5XX_RBBM_CLOCK_CNTL2_SP2, 0x02222220},
	{REG_A5XX_RBBM_CLOCK_CNTL2_SP3, 0x02222220},
	{REG_A5XX_RBBM_CLOCK_HYST_SP0, 0x0000F3CF},
	{REG_A5XX_RBBM_CLOCK_HYST_SP1, 0x0000F3CF},
	{REG_A5XX_RBBM_CLOCK_HYST_SP2, 0x0000F3CF},
	{REG_A5XX_RBBM_CLOCK_HYST_SP3, 0x0000F3CF},
	{REG_A5XX_RBBM_CLOCK_DELAY_SP0, 0x00000080},
	{REG_A5XX_RBBM_CLOCK_DELAY_SP1, 0x00000080},
	{REG_A5XX_RBBM_CLOCK_DELAY_SP2, 0x00000080},
	{REG_A5XX_RBBM_CLOCK_DELAY_SP3, 0x00000080},
	{REG_A5XX_RBBM_CLOCK_CNTL_TP0, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_TP1, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_TP2, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_TP3, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_TP0, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_TP1, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_TP2, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_TP3, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL3_TP0, 0x00002222},
	{REG_A5XX_RBBM_CLOCK_CNTL3_TP1, 0x00002222},
	{REG_A5XX_RBBM_CLOCK_CNTL3_TP2, 0x00002222},
	{REG_A5XX_RBBM_CLOCK_CNTL3_TP3, 0x00002222},
	{REG_A5XX_RBBM_CLOCK_HYST_TP0, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST_TP1, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST_TP2, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST_TP3, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST2_TP0, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST2_TP1, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST2_TP2, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST2_TP3, 0x77777777},
	{REG_A5XX_RBBM_CLOCK_HYST3_TP0, 0x00007777},
	{REG_A5XX_RBBM_CLOCK_HYST3_TP1, 0x00007777},
	{REG_A5XX_RBBM_CLOCK_HYST3_TP2, 0x00007777},
	{REG_A5XX_RBBM_CLOCK_HYST3_TP3, 0x00007777},
	{REG_A5XX_RBBM_CLOCK_DELAY_TP0, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY_TP1, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY_TP2, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY_TP3, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY2_TP0, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY2_TP1, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY2_TP2, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY2_TP3, 0x11111111},
	{REG_A5XX_RBBM_CLOCK_DELAY3_TP0, 0x00001111},
	{REG_A5XX_RBBM_CLOCK_DELAY3_TP1, 0x00001111},
	{REG_A5XX_RBBM_CLOCK_DELAY3_TP2, 0x00001111},
	{REG_A5XX_RBBM_CLOCK_DELAY3_TP3, 0x00001111},
	{REG_A5XX_RBBM_CLOCK_CNTL_UCHE, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_UCHE, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL3_UCHE, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL4_UCHE, 0x00222222},
	{REG_A5XX_RBBM_CLOCK_HYST_UCHE, 0x00444444},
	{REG_A5XX_RBBM_CLOCK_DELAY_UCHE, 0x00000002},
	{REG_A5XX_RBBM_CLOCK_CNTL_RB0, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_RB1, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_RB2, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_RB3, 0x22222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_RB0, 0x00222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_RB1, 0x00222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_RB2, 0x00222222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_RB3, 0x00222222},
	{REG_A5XX_RBBM_CLOCK_CNTL_CCU0, 0x00022220},
	{REG_A5XX_RBBM_CLOCK_CNTL_CCU1, 0x00022220},
	{REG_A5XX_RBBM_CLOCK_CNTL_CCU2, 0x00022220},
	{REG_A5XX_RBBM_CLOCK_CNTL_CCU3, 0x00022220},
	{REG_A5XX_RBBM_CLOCK_CNTL_RAC, 0x05522222},
	{REG_A5XX_RBBM_CLOCK_CNTL2_RAC, 0x00505555},
	{REG_A5XX_RBBM_CLOCK_HYST_RB_CCU0, 0x04040404},
	{REG_A5XX_RBBM_CLOCK_HYST_RB_CCU1, 0x04040404},
	{REG_A5XX_RBBM_CLOCK_HYST_RB_CCU2, 0x04040404},
	{REG_A5XX_RBBM_CLOCK_HYST_RB_CCU3, 0x04040404},
	{REG_A5XX_RBBM_CLOCK_HYST_RAC, 0x07444044},
	{REG_A5XX_RBBM_CLOCK_DELAY_RB_CCU_L1_0, 0x00000002},
	{REG_A5XX_RBBM_CLOCK_DELAY_RB_CCU_L1_1, 0x00000002},
	{REG_A5XX_RBBM_CLOCK_DELAY_RB_CCU_L1_2, 0x00000002},
	{REG_A5XX_RBBM_CLOCK_DELAY_RB_CCU_L1_3, 0x00000002},
	{REG_A5XX_RBBM_CLOCK_DELAY_RAC, 0x00010011},
	{REG_A5XX_RBBM_CLOCK_CNTL_TSE_RAS_RBBM, 0x04222222},
	{REG_A5XX_RBBM_CLOCK_MODE_GPC, 0x02222222},
	{REG_A5XX_RBBM_CLOCK_MODE_VFD, 0x00002222},
	{REG_A5XX_RBBM_CLOCK_HYST_TSE_RAS_RBBM, 0x00000000},
	{REG_A5XX_RBBM_CLOCK_HYST_GPC, 0x04104004},
	{REG_A5XX_RBBM_CLOCK_HYST_VFD, 0x00000000},
	{REG_A5XX_RBBM_CLOCK_DELAY_HLSQ, 0x00000000},
	{REG_A5XX_RBBM_CLOCK_DELAY_TSE_RAS_RBBM, 0x00004000},
	{REG_A5XX_RBBM_CLOCK_DELAY_GPC, 0x00000200},
	{REG_A5XX_RBBM_CLOCK_DELAY_VFD, 0x00002222}
};

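/* Enable or disable hardware clock gating for all of the blocks listed above */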
void a5xx_set_hwcg(struct msm_gpu *gpu, bool state)
{
	unsigned int i;

	for (i = 0; i < ARRAY_SIZE(a5xx_hwcg); i++)
		gpu_write(gpu, a5xx_hwcg[i].offset,
			state ? a5xx_hwcg[i].value : 0);

	gpu_write(gpu, REG_A5XX_RBBM_CLOCK_CNTL, state ? 0xAAA8AA00 : 0);
	gpu_write(gpu, REG_A5XX_RBBM_ISDB_CNT, state ? 0x182 : 0x180);
}

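/*
 * Issue CP_ME_INIT to initialize the microengine and wait for the GPU to go
 * idle again before continuing.
 */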
static int a5xx_me_init(struct msm_gpu *gpu)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	struct msm_ringbuffer *ring = gpu->rb;

	OUT_PKT7(ring, CP_ME_INIT, 8);

	OUT_RING(ring, 0x0000002F);

	/* Enable multiple hardware contexts */
	OUT_RING(ring, 0x00000003);

	/* Enable error detection */
	OUT_RING(ring, 0x20000000);

	/* Don't enable header dump */
	OUT_RING(ring, 0x00000000);
	OUT_RING(ring, 0x00000000);

	/* Specify workarounds for various microcode issues */
	if (adreno_is_a530(adreno_gpu)) {
		/* Workaround for token end syncs
		 * Force a WFI after every direct-render 3D mode draw and every
		 * 2D mode 3 draw
		 */
		OUT_RING(ring, 0x0000000B);
	} else {
		/* No workarounds enabled */
		OUT_RING(ring, 0x00000000);
	}

	OUT_RING(ring, 0x00000000);
	OUT_RING(ring, 0x00000000);

	gpu->funcs->flush(gpu);

	return a5xx_idle(gpu) ? 0 : -EINVAL;
}

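/*
 * Copy a microcode image into a new GPU-readonly buffer object, skipping the
 * first four bytes of the firmware file, and return the object along with its
 * GPU address in *iova.
 */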
static struct drm_gem_object *a5xx_ucode_load_bo(struct msm_gpu *gpu,
	const struct firmware *fw, u64 *iova)
{
	struct drm_gem_object *bo;
	void *ptr;

	ptr = msm_gem_kernel_new_locked(gpu->dev, fw->size - 4,
		MSM_BO_UNCACHED | MSM_BO_GPU_READONLY, gpu->aspace, &bo, iova);

	if (IS_ERR(ptr))
		return ERR_CAST(ptr);

	memcpy(ptr, &fw->data[4], fw->size - 4);

	msm_gem_put_vaddr(bo);
	return bo;
}

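/*
 * Load the PM4 and PFP microcode into GPU buffers (once) and program the CP
 * instruction base registers to point at them.
 */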
static int a5xx_ucode_init(struct msm_gpu *gpu)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	struct a5xx_gpu *a5xx_gpu = to_a5xx_gpu(adreno_gpu);
	int ret;

	if (!a5xx_gpu->pm4_bo) {
		a5xx_gpu->pm4_bo = a5xx_ucode_load_bo(gpu, adreno_gpu->pm4,
			&a5xx_gpu->pm4_iova);

		if (IS_ERR(a5xx_gpu->pm4_bo)) {
			ret = PTR_ERR(a5xx_gpu->pm4_bo);
			a5xx_gpu->pm4_bo = NULL;
			dev_err(gpu->dev->dev, "could not allocate PM4: %d\n",
				ret);
			return ret;
		}
	}

	if (!a5xx_gpu->pfp_bo) {
		a5xx_gpu->pfp_bo = a5xx_ucode_load_bo(gpu, adreno_gpu->pfp,
			&a5xx_gpu->pfp_iova);

		if (IS_ERR(a5xx_gpu->pfp_bo)) {
			ret = PTR_ERR(a5xx_gpu->pfp_bo);
			a5xx_gpu->pfp_bo = NULL;
			dev_err(gpu->dev->dev, "could not allocate PFP: %d\n",
				ret);
			return ret;
		}
	}

	gpu_write64(gpu, REG_A5XX_CP_ME_INSTR_BASE_LO,
		REG_A5XX_CP_ME_INSTR_BASE_HI, a5xx_gpu->pm4_iova);

	gpu_write64(gpu, REG_A5XX_CP_PFP_INSTR_BASE_LO,
		REG_A5XX_CP_PFP_INSTR_BASE_HI, a5xx_gpu->pfp_iova);

	return 0;
}

#define SCM_GPU_ZAP_SHADER_RESUME 0

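/* Ask the secure world to restart a zap shader that has already been loaded */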
static int a5xx_zap_shader_resume(struct msm_gpu *gpu)
{
	int ret;

	ret = qcom_scm_set_remote_state(SCM_GPU_ZAP_SHADER_RESUME, GPU_PAS_ID);
	if (ret)
		DRM_ERROR("%s: zap-shader resume failed: %d\n",
			gpu->name, ret);

	return ret;
}

static int a5xx_zap_shader_init(struct msm_gpu *gpu)
{
	static bool loaded;
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	struct platform_device *pdev = gpu->pdev;
	int ret;

	/*
	 * If the zap shader is already loaded into memory we just need to kick
	 * the remote processor to reinitialize it
	 */
	if (loaded)
		return a5xx_zap_shader_resume(gpu);

	/* We need SCM to be able to load the firmware */
	if (!qcom_scm_is_available()) {
		DRM_DEV_ERROR(&pdev->dev, "SCM is not available\n");
		return -EPROBE_DEFER;
	}

	/* Each GPU has a target specific zap shader firmware name to use */
	if (!adreno_gpu->info->zapfw) {
		DRM_DEV_ERROR(&pdev->dev,
			"Zap shader firmware file not specified for this target\n");
		return -ENODEV;
	}

	ret = zap_shader_load_mdt(&pdev->dev, adreno_gpu->info->zapfw);

	loaded = !ret;

	return ret;
}

#define A5XX_INT_MASK (A5XX_RBBM_INT_0_MASK_RBBM_AHB_ERROR | \
	A5XX_RBBM_INT_0_MASK_RBBM_TRANSFER_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_ME_MS_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_PFP_MS_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_ETS_MS_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_ATB_ASYNC_OVERFLOW | \
	A5XX_RBBM_INT_0_MASK_CP_HW_ERROR | \
	A5XX_RBBM_INT_0_MASK_MISC_HANG_DETECT | \
	A5XX_RBBM_INT_0_MASK_CP_CACHE_FLUSH_TS | \
	A5XX_RBBM_INT_0_MASK_UCHE_OOB_ACCESS | \
	A5XX_RBBM_INT_0_MASK_GPMU_VOLTAGE_DROOP)

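/*
 * Per-resume hardware bringup: program static configuration, load the
 * microcode, start the CP and attempt to leave secure mode via the zap
 * shader.
 */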
static int a5xx_hw_init(struct msm_gpu *gpu)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	int ret;

	gpu_write(gpu, REG_A5XX_VBIF_ROUND_ROBIN_QOS_ARB, 0x00000003);

	/* Make all blocks contribute to the GPU BUSY perf counter */
	gpu_write(gpu, REG_A5XX_RBBM_PERFCTR_GPU_BUSY_MASKED, 0xFFFFFFFF);

	/* Enable RBBM error reporting bits */
	gpu_write(gpu, REG_A5XX_RBBM_AHB_CNTL0, 0x00000001);

	if (adreno_gpu->info->quirks & ADRENO_QUIRK_FAULT_DETECT_MASK) {
		/*
		 * Mask out the activity signals from RB1-3 to avoid false
		 * positives
		 */

		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL11,
			0xF0000000);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL12,
			0xFFFFFFFF);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL13,
			0xFFFFFFFF);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL14,
			0xFFFFFFFF);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL15,
			0xFFFFFFFF);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL16,
			0xFFFFFFFF);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL17,
			0xFFFFFFFF);
		gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_MASK_CNTL18,
			0xFFFFFFFF);
	}

	/* Enable fault detection */
	gpu_write(gpu, REG_A5XX_RBBM_INTERFACE_HANG_INT_CNTL,
		(1 << 30) | 0xFFFF);

	/* Turn on performance counters */
	gpu_write(gpu, REG_A5XX_RBBM_PERFCTR_CNTL, 0x01);

	/* Increase VFD cache access so LRZ and other data gets evicted less */
	gpu_write(gpu, REG_A5XX_UCHE_CACHE_WAYS, 0x02);

	/* Disable L2 bypass in the UCHE */
	gpu_write(gpu, REG_A5XX_UCHE_TRAP_BASE_LO, 0xFFFF0000);
	gpu_write(gpu, REG_A5XX_UCHE_TRAP_BASE_HI, 0x0001FFFF);
	gpu_write(gpu, REG_A5XX_UCHE_WRITE_THRU_BASE_LO, 0xFFFF0000);
	gpu_write(gpu, REG_A5XX_UCHE_WRITE_THRU_BASE_HI, 0x0001FFFF);

	/* Set the GMEM VA range (0 to gpu->gmem) */
	gpu_write(gpu, REG_A5XX_UCHE_GMEM_RANGE_MIN_LO, 0x00100000);
	gpu_write(gpu, REG_A5XX_UCHE_GMEM_RANGE_MIN_HI, 0x00000000);
	gpu_write(gpu, REG_A5XX_UCHE_GMEM_RANGE_MAX_LO,
		0x00100000 + adreno_gpu->gmem - 1);
	gpu_write(gpu, REG_A5XX_UCHE_GMEM_RANGE_MAX_HI, 0x00000000);

	gpu_write(gpu, REG_A5XX_CP_MEQ_THRESHOLDS, 0x40);
	gpu_write(gpu, REG_A5XX_CP_MERCIU_SIZE, 0x40);
	gpu_write(gpu, REG_A5XX_CP_ROQ_THRESHOLDS_2, 0x80000060);
	gpu_write(gpu, REG_A5XX_CP_ROQ_THRESHOLDS_1, 0x40201B16);

	gpu_write(gpu, REG_A5XX_PC_DBG_ECO_CNTL, (0x400 << 11 | 0x300 << 22));

	if (adreno_gpu->info->quirks & ADRENO_QUIRK_TWO_PASS_USE_WFI)
		gpu_rmw(gpu, REG_A5XX_PC_DBG_ECO_CNTL, 0, (1 << 8));

	gpu_write(gpu, REG_A5XX_PC_DBG_ECO_CNTL, 0xc0200100);

	/* Enable USE_RETENTION_FLOPS */
	gpu_write(gpu, REG_A5XX_CP_CHICKEN_DBG, 0x02000000);

	/* Enable ME/PFP split notification */
	gpu_write(gpu, REG_A5XX_RBBM_AHB_CNTL1, 0xA6FFFFFF);

	/* Enable HWCG */
	a5xx_set_hwcg(gpu, true);

	gpu_write(gpu, REG_A5XX_RBBM_AHB_CNTL2, 0x0000003F);

	/* Set the highest bank bit */
	gpu_write(gpu, REG_A5XX_TPL1_MODE_CNTL, 2 << 7);
	gpu_write(gpu, REG_A5XX_RB_MODE_CNTL, 2 << 1);

	/* Protect registers from the CP */
	gpu_write(gpu, REG_A5XX_CP_PROTECT_CNTL, 0x00000007);

	/* RBBM */
	gpu_write(gpu, REG_A5XX_CP_PROTECT(0), ADRENO_PROTECT_RW(0x04, 4));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(1), ADRENO_PROTECT_RW(0x08, 8));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(2), ADRENO_PROTECT_RW(0x10, 16));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(3), ADRENO_PROTECT_RW(0x20, 32));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(4), ADRENO_PROTECT_RW(0x40, 64));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(5), ADRENO_PROTECT_RW(0x80, 64));

	/* Content protect */
	gpu_write(gpu, REG_A5XX_CP_PROTECT(6),
		ADRENO_PROTECT_RW(REG_A5XX_RBBM_SECVID_TSB_TRUSTED_BASE_LO,
			16));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(7),
		ADRENO_PROTECT_RW(REG_A5XX_RBBM_SECVID_TRUST_CNTL, 2));

	/* CP */
	gpu_write(gpu, REG_A5XX_CP_PROTECT(8), ADRENO_PROTECT_RW(0x800, 64));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(9), ADRENO_PROTECT_RW(0x840, 8));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(10), ADRENO_PROTECT_RW(0x880, 32));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(11), ADRENO_PROTECT_RW(0xAA0, 1));

	/* RB */
	gpu_write(gpu, REG_A5XX_CP_PROTECT(12), ADRENO_PROTECT_RW(0xCC0, 1));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(13), ADRENO_PROTECT_RW(0xCF0, 2));

	/* VPC */
	gpu_write(gpu, REG_A5XX_CP_PROTECT(14), ADRENO_PROTECT_RW(0xE68, 8));
	gpu_write(gpu, REG_A5XX_CP_PROTECT(15), ADRENO_PROTECT_RW(0xE70, 4));

	/* UCHE */
	gpu_write(gpu, REG_A5XX_CP_PROTECT(16), ADRENO_PROTECT_RW(0xE80, 16));

	if (adreno_is_a530(adreno_gpu))
		gpu_write(gpu, REG_A5XX_CP_PROTECT(17),
			ADRENO_PROTECT_RW(0x10000, 0x8000));

	gpu_write(gpu, REG_A5XX_RBBM_SECVID_TSB_CNTL, 0);
	/*
	 * Disable the trusted memory range - we don't actually support secure
	 * memory rendering at this point in time and we don't want to block off
	 * part of the virtual memory space.
	 */
	gpu_write64(gpu, REG_A5XX_RBBM_SECVID_TSB_TRUSTED_BASE_LO,
		REG_A5XX_RBBM_SECVID_TSB_TRUSTED_BASE_HI, 0x00000000);
	gpu_write(gpu, REG_A5XX_RBBM_SECVID_TSB_TRUSTED_SIZE, 0x00000000);

	/* Load the GPMU firmware before starting the HW init */
	a5xx_gpmu_ucode_init(gpu);

	ret = adreno_hw_init(gpu);
	if (ret)
		return ret;

	ret = a5xx_ucode_init(gpu);
	if (ret)
		return ret;

	/* Disable the interrupts through the initial bringup stage */
	gpu_write(gpu, REG_A5XX_RBBM_INT_0_MASK, A5XX_INT_MASK);

	/* Clear ME_HALT to start the micro engine */
	gpu_write(gpu, REG_A5XX_CP_PFP_ME_CNTL, 0);
	ret = a5xx_me_init(gpu);
	if (ret)
		return ret;

	ret = a5xx_power_init(gpu);
	if (ret)
		return ret;

	/*
	 * Send a pipeline event stat to get misbehaving counters to start
	 * ticking correctly
	 */
	if (adreno_is_a530(adreno_gpu)) {
		OUT_PKT7(gpu->rb, CP_EVENT_WRITE, 1);
		OUT_RING(gpu->rb, 0x0F);

		gpu->funcs->flush(gpu);
		if (!a5xx_idle(gpu))
			return -EINVAL;
	}

	/*
	 * Try to load a zap shader into the secure world. If successful
	 * we can use the CP to switch out of secure mode. If not then we
	 * have no recourse but to try to switch ourselves out manually. If we
	 * guessed wrong then access to the RBBM_SECVID_TRUST_CNTL register will
	 * be blocked and a permissions violation will soon follow.
	 */
	ret = a5xx_zap_shader_init(gpu);
	if (!ret) {
		OUT_PKT7(gpu->rb, CP_SET_SECURE_MODE, 1);
		OUT_RING(gpu->rb, 0x00000000);

		gpu->funcs->flush(gpu);
		if (!a5xx_idle(gpu))
			return -EINVAL;
	} else {
		/* Print a warning so if we die, we know why */
		dev_warn_once(gpu->dev->dev,
			"Zap shader not enabled - using SECVID_TRUST_CNTL instead\n");
		gpu_write(gpu, REG_A5XX_RBBM_SECVID_TRUST_CNTL, 0x0);
	}

	return 0;
}

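/*
 * Dump some debugging state, soft reset the GPU via RBBM_SW_RESET_CMD and
 * hand off to the common adreno recovery path.
 */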
static void a5xx_recover(struct msm_gpu *gpu)
{
	int i;

	adreno_dump_info(gpu);

	for (i = 0; i < 8; i++) {
		printk("CP_SCRATCH_REG%d: %u\n", i,
			gpu_read(gpu, REG_A5XX_CP_SCRATCH_REG(i)));
	}

	if (hang_debug)
		a5xx_dump(gpu);

	gpu_write(gpu, REG_A5XX_RBBM_SW_RESET_CMD, 1);
	gpu_read(gpu, REG_A5XX_RBBM_SW_RESET_CMD);
	gpu_write(gpu, REG_A5XX_RBBM_SW_RESET_CMD, 0);
	adreno_recover(gpu);
}

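/* Release the microcode and GPMU objects and tear down the common adreno state */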
static void a5xx_destroy(struct msm_gpu *gpu)
{
	struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
	struct a5xx_gpu *a5xx_gpu = to_a5xx_gpu(adreno_gpu);

	DBG("%s", gpu->name);

	if (a5xx_gpu->pm4_bo) {
		if (a5xx_gpu->pm4_iova)
			msm_gem_put_iova(a5xx_gpu->pm4_bo, gpu->aspace);
		drm_gem_object_unreference_unlocked(a5xx_gpu->pm4_bo);
	}

	if (a5xx_gpu->pfp_bo) {
		if (a5xx_gpu->pfp_iova)
			msm_gem_put_iova(a5xx_gpu->pfp_bo, gpu->aspace);
		drm_gem_object_unreference_unlocked(a5xx_gpu->pfp_bo);
	}

	if (a5xx_gpu->gpmu_bo) {
		if (a5xx_gpu->gpmu_iova)
			msm_gem_put_iova(a5xx_gpu->gpmu_bo, gpu->aspace);
		drm_gem_object_unreference_unlocked(a5xx_gpu->gpmu_bo);
	}

	adreno_gpu_cleanup(adreno_gpu);
	kfree(a5xx_gpu);
}

static inline bool _a5xx_check_idle(struct msm_gpu *gpu)
{
	if (gpu_read(gpu, REG_A5XX_RBBM_STATUS) & ~A5XX_RBBM_STATUS_HI_BUSY)
		return false;

	/*
	 * Nearly every abnormality ends up pausing the GPU and triggering a
	 * fault so we can safely just watch for this one interrupt to fire
	 */
	return !(gpu_read(gpu, REG_A5XX_RBBM_INT_0_STATUS) &
		A5XX_RBBM_INT_0_MASK_MISC_HANG_DETECT);
}

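/*
 * Wait for the ringbuffer to drain and the GPU to go idle; returns false (and
 * logs the current status) if the GPU is still busy after the timeout.
 */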
bool a5xx_idle(struct msm_gpu *gpu)
{
	/* wait for CP to drain ringbuffer: */
	if (!adreno_idle(gpu))
		return false;

	if (spin_until(_a5xx_check_idle(gpu))) {
		DRM_ERROR("%s: %ps: timeout waiting for GPU to idle: status %8.8X irq %8.8X\n",
			gpu->name, __builtin_return_address(0),
			gpu_read(gpu, REG_A5XX_RBBM_STATUS),
			gpu_read(gpu, REG_A5XX_RBBM_INT_0_STATUS));

		return false;
	}

	return true;
}

static int a5xx_fault_handler(void *arg, unsigned long iova, int flags)
{
	struct msm_gpu *gpu = arg;
	pr_warn_ratelimited("*** gpu fault: iova=%08lx, flags=%d (%u,%u,%u,%u)\n",
		iova, flags,
		gpu_read(gpu, REG_A5XX_CP_SCRATCH_REG(4)),
		gpu_read(gpu, REG_A5XX_CP_SCRATCH_REG(5)),
		gpu_read(gpu, REG_A5XX_CP_SCRATCH_REG(6)),
		gpu_read(gpu, REG_A5XX_CP_SCRATCH_REG(7)));

	return -EFAULT;
}

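/* Decode and log the individual CP error sources reported by CP_INTERRUPT_STATUS */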
static void a5xx_cp_err_irq(struct msm_gpu *gpu)
{
	u32 status = gpu_read(gpu, REG_A5XX_CP_INTERRUPT_STATUS);

	if (status & A5XX_CP_INT_CP_OPCODE_ERROR) {
		u32 val;

		gpu_write(gpu, REG_A5XX_CP_PFP_STAT_ADDR, 0);

		/*
		 * REG_A5XX_CP_PFP_STAT_DATA is indexed, and we want index 1 so
		 * read it twice
		 */

		gpu_read(gpu, REG_A5XX_CP_PFP_STAT_DATA);
		val = gpu_read(gpu, REG_A5XX_CP_PFP_STAT_DATA);

		dev_err_ratelimited(gpu->dev->dev, "CP | opcode error | possible opcode=0x%8.8X\n",
			val);
	}

	if (status & A5XX_CP_INT_CP_HW_FAULT_ERROR)
		dev_err_ratelimited(gpu->dev->dev, "CP | HW fault | status=0x%8.8X\n",
			gpu_read(gpu, REG_A5XX_CP_HW_FAULT));

	if (status & A5XX_CP_INT_CP_DMA_ERROR)
		dev_err_ratelimited(gpu->dev->dev, "CP | DMA error\n");

	if (status & A5XX_CP_INT_CP_REGISTER_PROTECTION_ERROR) {
		u32 val = gpu_read(gpu, REG_A5XX_CP_PROTECT_STATUS);

		dev_err_ratelimited(gpu->dev->dev,
			"CP | protected mode error | %s | addr=0x%8.8X | status=0x%8.8X\n",
			val & (1 << 24) ? "WRITE" : "READ",
			(val & 0xFFFFF) >> 2, val);
	}

	if (status & A5XX_CP_INT_CP_AHB_ERROR) {
		u32 status = gpu_read(gpu, REG_A5XX_CP_AHB_FAULT);
		const char *access[16] = { "reserved", "reserved",
			"timestamp lo", "timestamp hi", "pfp read", "pfp write",
			"", "", "me read", "me write", "", "", "crashdump read",
			"crashdump write" };

		dev_err_ratelimited(gpu->dev->dev,
			"CP | AHB error | addr=%X access=%s error=%d | status=0x%8.8X\n",
			status & 0xFFFFF, access[(status >> 24) & 0xF],
			(status & (1 << 31)), status);
	}
}

static void a5xx_rbbm_err_irq(struct msm_gpu *gpu, u32 status)
{
	if (status & A5XX_RBBM_INT_0_MASK_RBBM_AHB_ERROR) {
		u32 val = gpu_read(gpu, REG_A5XX_RBBM_AHB_ERROR_STATUS);

		dev_err_ratelimited(gpu->dev->dev,
			"RBBM | AHB bus error | %s | addr=0x%X | ports=0x%X:0x%X\n",
			val & (1 << 28) ? "WRITE" : "READ",
			(val & 0xFFFFF) >> 2, (val >> 20) & 0x3,
			(val >> 24) & 0xF);

		/* Clear the error */
		gpu_write(gpu, REG_A5XX_RBBM_AHB_CMD, (1 << 4));

		/* Clear the interrupt */
		gpu_write(gpu, REG_A5XX_RBBM_INT_CLEAR_CMD,
			A5XX_RBBM_INT_0_MASK_RBBM_AHB_ERROR);
	}

	if (status & A5XX_RBBM_INT_0_MASK_RBBM_TRANSFER_TIMEOUT)
		dev_err_ratelimited(gpu->dev->dev, "RBBM | AHB transfer timeout\n");

	if (status & A5XX_RBBM_INT_0_MASK_RBBM_ME_MS_TIMEOUT)
		dev_err_ratelimited(gpu->dev->dev, "RBBM | ME master split | status=0x%X\n",
			gpu_read(gpu, REG_A5XX_RBBM_AHB_ME_SPLIT_STATUS));

	if (status & A5XX_RBBM_INT_0_MASK_RBBM_PFP_MS_TIMEOUT)
		dev_err_ratelimited(gpu->dev->dev, "RBBM | PFP master split | status=0x%X\n",
			gpu_read(gpu, REG_A5XX_RBBM_AHB_PFP_SPLIT_STATUS));

	if (status & A5XX_RBBM_INT_0_MASK_RBBM_ETS_MS_TIMEOUT)
		dev_err_ratelimited(gpu->dev->dev, "RBBM | ETS master split | status=0x%X\n",
			gpu_read(gpu, REG_A5XX_RBBM_AHB_ETS_SPLIT_STATUS));

	if (status & A5XX_RBBM_INT_0_MASK_RBBM_ATB_ASYNC_OVERFLOW)
		dev_err_ratelimited(gpu->dev->dev, "RBBM | ATB ASYNC overflow\n");

	if (status & A5XX_RBBM_INT_0_MASK_RBBM_ATB_BUS_OVERFLOW)
		dev_err_ratelimited(gpu->dev->dev, "RBBM | ATB bus overflow\n");
}

static void a5xx_uche_err_irq(struct msm_gpu *gpu)
{
	uint64_t addr = (uint64_t) gpu_read(gpu, REG_A5XX_UCHE_TRAP_LOG_HI);

	addr |= gpu_read(gpu, REG_A5XX_UCHE_TRAP_LOG_LO);

	dev_err_ratelimited(gpu->dev->dev, "UCHE | Out of bounds access | addr=0x%llX\n",
		addr);
}

static void a5xx_gpmu_err_irq(struct msm_gpu *gpu)
{
	dev_err_ratelimited(gpu->dev->dev, "GPMU | voltage droop\n");
}

static void a5xx_fault_detect_irq(struct msm_gpu *gpu)
{
	struct drm_device *dev = gpu->dev;
	struct msm_drm_private *priv = dev->dev_private;

	dev_err(dev->dev, "gpu fault fence %x status %8.8X rb %4.4x/%4.4x ib1 %16.16llX/%4.4x ib2 %16.16llX/%4.4x\n",
		gpu->funcs->last_fence(gpu),
		gpu_read(gpu, REG_A5XX_RBBM_STATUS),
		gpu_read(gpu, REG_A5XX_CP_RB_RPTR),
		gpu_read(gpu, REG_A5XX_CP_RB_WPTR),
		gpu_read64(gpu, REG_A5XX_CP_IB1_BASE, REG_A5XX_CP_IB1_BASE_HI),
		gpu_read(gpu, REG_A5XX_CP_IB1_BUFSZ),
		gpu_read64(gpu, REG_A5XX_CP_IB2_BASE, REG_A5XX_CP_IB2_BASE_HI),
		gpu_read(gpu, REG_A5XX_CP_IB2_BUFSZ));

	/* Turn off the hangcheck timer to keep it from bothering us */
	del_timer(&gpu->hangcheck_timer);

	queue_work(priv->wq, &gpu->recover_work);
}

#define RBBM_ERROR_MASK \
	(A5XX_RBBM_INT_0_MASK_RBBM_AHB_ERROR | \
	A5XX_RBBM_INT_0_MASK_RBBM_TRANSFER_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_ME_MS_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_PFP_MS_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_ETS_MS_TIMEOUT | \
	A5XX_RBBM_INT_0_MASK_RBBM_ATB_ASYNC_OVERFLOW)

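/*
 * Top level interrupt handler - clear the interrupt status and dispatch each
 * asserted source to its handler, retiring submits on CACHE_FLUSH_TS.
 */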
static irqreturn_t a5xx_irq(struct msm_gpu *gpu)
{
	u32 status = gpu_read(gpu, REG_A5XX_RBBM_INT_0_STATUS);

	/*
	 * Clear all the interrupts except RBBM_AHB_ERROR - if we clear it
	 * before the source is cleared the interrupt will storm.
	 */
	gpu_write(gpu, REG_A5XX_RBBM_INT_CLEAR_CMD,
		status & ~A5XX_RBBM_INT_0_MASK_RBBM_AHB_ERROR);

	/* Pass status to a5xx_rbbm_err_irq because we've already cleared it */
	if (status & RBBM_ERROR_MASK)
		a5xx_rbbm_err_irq(gpu, status);

	if (status & A5XX_RBBM_INT_0_MASK_CP_HW_ERROR)
		a5xx_cp_err_irq(gpu);

	if (status & A5XX_RBBM_INT_0_MASK_MISC_HANG_DETECT)
		a5xx_fault_detect_irq(gpu);

	if (status & A5XX_RBBM_INT_0_MASK_UCHE_OOB_ACCESS)
		a5xx_uche_err_irq(gpu);

	if (status & A5XX_RBBM_INT_0_MASK_GPMU_VOLTAGE_DROOP)
		a5xx_gpmu_err_irq(gpu);

	if (status & A5XX_RBBM_INT_0_MASK_CP_CACHE_FLUSH_TS)
		msm_gpu_retire(gpu);

	return IRQ_HANDLED;
}

static const u32 a5xx_register_offsets[REG_ADRENO_REGISTER_MAX] = {
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_BASE, REG_A5XX_CP_RB_BASE),
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_BASE_HI, REG_A5XX_CP_RB_BASE_HI),
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_RPTR_ADDR, REG_A5XX_CP_RB_RPTR_ADDR),
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_RPTR_ADDR_HI,
		REG_A5XX_CP_RB_RPTR_ADDR_HI),
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_RPTR, REG_A5XX_CP_RB_RPTR),
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_WPTR, REG_A5XX_CP_RB_WPTR),
	REG_ADRENO_DEFINE(REG_ADRENO_CP_RB_CNTL, REG_A5XX_CP_RB_CNTL),
};

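/* Inclusive register ranges (terminated by ~0) read back when dumping GPU state */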
static const u32 a5xx_registers[] = {
	0x0000, 0x0002, 0x0004, 0x0020, 0x0022, 0x0026, 0x0029, 0x002B,
	0x002E, 0x0035, 0x0038, 0x0042, 0x0044, 0x0044, 0x0047, 0x0095,
	0x0097, 0x00BB, 0x03A0, 0x0464, 0x0469, 0x046F, 0x04D2, 0x04D3,
	0x04E0, 0x0533, 0x0540, 0x0555, 0x0800, 0x081A, 0x081F, 0x0841,
	0x0860, 0x0860, 0x0880, 0x08A0, 0x0B00, 0x0B12, 0x0B15, 0x0B28,
	0x0B78, 0x0B7F, 0x0BB0, 0x0BBD, 0x0BC0, 0x0BC6, 0x0BD0, 0x0C53,
	0x0C60, 0x0C61, 0x0C80, 0x0C82, 0x0C84, 0x0C85, 0x0C90, 0x0C98,
	0x0CA0, 0x0CA0, 0x0CB0, 0x0CB2, 0x2180, 0x2185, 0x2580, 0x2585,
	0x0CC1, 0x0CC1, 0x0CC4, 0x0CC7, 0x0CCC, 0x0CCC, 0x0CD0, 0x0CD8,
	0x0CE0, 0x0CE5, 0x0CE8, 0x0CE8, 0x0CEC, 0x0CF1, 0x0CFB, 0x0D0E,
	0x2100, 0x211E, 0x2140, 0x2145, 0x2500, 0x251E, 0x2540, 0x2545,
	0x0D10, 0x0D17, 0x0D20, 0x0D23, 0x0D30, 0x0D30, 0x20C0, 0x20C0,
	0x24C0, 0x24C0, 0x0E40, 0x0E43, 0x0E4A, 0x0E4A, 0x0E50, 0x0E57,
	0x0E60, 0x0E7C, 0x0E80, 0x0E8E, 0x0E90, 0x0E96, 0x0EA0, 0x0EA8,
	0x0EB0, 0x0EB2, 0xE140, 0xE147, 0xE150, 0xE187, 0xE1A0, 0xE1A9,
	0xE1B0, 0xE1B6, 0xE1C0, 0xE1C7, 0xE1D0, 0xE1D1, 0xE200, 0xE201,
	0xE210, 0xE21C, 0xE240, 0xE268, 0xE000, 0xE006, 0xE010, 0xE09A,
	0xE0A0, 0xE0A4, 0xE0AA, 0xE0EB, 0xE100, 0xE105, 0xE380, 0xE38F,
	0xE3B0, 0xE3B0, 0xE400, 0xE405, 0xE408, 0xE4E9, 0xE4F0, 0xE4F0,
	0xE280, 0xE280, 0xE282, 0xE2A3, 0xE2A5, 0xE2C2, 0xE940, 0xE947,
	0xE950, 0xE987, 0xE9A0, 0xE9A9, 0xE9B0, 0xE9B6, 0xE9C0, 0xE9C7,
	0xE9D0, 0xE9D1, 0xEA00, 0xEA01, 0xEA10, 0xEA1C, 0xEA40, 0xEA68,
	0xE800, 0xE806, 0xE810, 0xE89A, 0xE8A0, 0xE8A4, 0xE8AA, 0xE8EB,
	0xE900, 0xE905, 0xEB80, 0xEB8F, 0xEBB0, 0xEBB0, 0xEC00, 0xEC05,
	0xEC08, 0xECE9, 0xECF0, 0xECF0, 0xEA80, 0xEA80, 0xEA82, 0xEAA3,
	0xEAA5, 0xEAC2, 0xA800, 0xA8FF, 0xAC60, 0xAC60, 0xB000, 0xB97F,
	0xB9A0, 0xB9BF, ~0
};

static void a5xx_dump(struct msm_gpu *gpu)
{
	dev_info(gpu->dev->dev, "status: %08x\n",
		gpu_read(gpu, REG_A5XX_RBBM_STATUS));
	adreno_dump(gpu);
}

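/*
 * Power up the core and then the RBCCU and SP power domains via the GPMU
 * power control registers, polling for each domain to come up.
 */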
static int a5xx_pm_resume(struct msm_gpu *gpu)
{
	int ret;

	/* Turn on the core power */
	ret = msm_gpu_pm_resume(gpu);
	if (ret)
		return ret;

	/* Turn on the RBCCU domain first to limit the chances of voltage droop */
	gpu_write(gpu, REG_A5XX_GPMU_RBCCU_POWER_CNTL, 0x778000);

	/* Wait 3 usecs before polling */
	udelay(3);

	ret = spin_usecs(gpu, 20, REG_A5XX_GPMU_RBCCU_PWR_CLK_STATUS,
		(1 << 20), (1 << 20));
	if (ret) {
		DRM_ERROR("%s: timeout waiting for RBCCU GDSC enable: %X\n",
			gpu->name,
			gpu_read(gpu, REG_A5XX_GPMU_RBCCU_PWR_CLK_STATUS));
		return ret;
	}

	/* Turn on the SP domain */
	gpu_write(gpu, REG_A5XX_GPMU_SP_POWER_CNTL, 0x778000);
	ret = spin_usecs(gpu, 20, REG_A5XX_GPMU_SP_PWR_CLK_STATUS,
		(1 << 20), (1 << 20));
	if (ret)
		DRM_ERROR("%s: timeout waiting for SP GDSC enable\n",
			gpu->name);

	return ret;
}

static int a5xx_pm_suspend(struct msm_gpu *gpu)
{
	/* Clear the VBIF pipe before shutting down */
	gpu_write(gpu, REG_A5XX_VBIF_XIN_HALT_CTRL0, 0xF);
	spin_until((gpu_read(gpu, REG_A5XX_VBIF_XIN_HALT_CTRL1) & 0xF) == 0xF);

	gpu_write(gpu, REG_A5XX_VBIF_XIN_HALT_CTRL0, 0);

	/*
	 * Reset the VBIF before power collapse to avoid issue with FIFO
	 * entries
	 */
	gpu_write(gpu, REG_A5XX_RBBM_BLOCK_SW_RESET_CMD, 0x003C0000);
	gpu_write(gpu, REG_A5XX_RBBM_BLOCK_SW_RESET_CMD, 0x00000000);

	return msm_gpu_pm_suspend(gpu);
}

static int a5xx_get_timestamp(struct msm_gpu *gpu, uint64_t *value)
{
	*value = gpu_read64(gpu, REG_A5XX_RBBM_PERFCTR_CP_0_LO,
		REG_A5XX_RBBM_PERFCTR_CP_0_HI);

	return 0;
}

#ifdef CONFIG_DEBUG_FS
static void a5xx_show(struct msm_gpu *gpu, struct seq_file *m)
{
	seq_printf(m, "status: %08x\n",
		gpu_read(gpu, REG_A5XX_RBBM_STATUS));

	/*
	 * Temporarily disable hardware clock gating before going into
	 * adreno_show to avoid issues while reading the registers
	 */
	a5xx_set_hwcg(gpu, false);
	adreno_show(gpu, m);
	a5xx_set_hwcg(gpu, true);
}
#endif

static const struct adreno_gpu_funcs funcs = {
	.base = {
		.get_param = adreno_get_param,
		.hw_init = a5xx_hw_init,
		.pm_suspend = a5xx_pm_suspend,
		.pm_resume = a5xx_pm_resume,
		.recover = a5xx_recover,
		.last_fence = adreno_last_fence,
		.submit = a5xx_submit,
		.flush = adreno_flush,
		.irq = a5xx_irq,
		.destroy = a5xx_destroy,
#ifdef CONFIG_DEBUG_FS
		.show = a5xx_show,
#endif
	},
	.get_timestamp = a5xx_get_timestamp,
};

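/* Allocate and initialize an A5XX GPU instance for the msm driver core */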
struct msm_gpu *a5xx_gpu_init(struct drm_device *dev)
{
	struct msm_drm_private *priv = dev->dev_private;
	struct platform_device *pdev = priv->gpu_pdev;
	struct a5xx_gpu *a5xx_gpu = NULL;
	struct adreno_gpu *adreno_gpu;
	struct msm_gpu *gpu;
	int ret;

	if (!pdev) {
		dev_err(dev->dev, "No A5XX device is defined\n");
		return ERR_PTR(-ENXIO);
	}

	a5xx_gpu = kzalloc(sizeof(*a5xx_gpu), GFP_KERNEL);
	if (!a5xx_gpu)
		return ERR_PTR(-ENOMEM);

	adreno_gpu = &a5xx_gpu->base;
	gpu = &adreno_gpu->base;

	adreno_gpu->registers = a5xx_registers;
	adreno_gpu->reg_offsets = a5xx_register_offsets;

	a5xx_gpu->lm_leakage = 0x4E001A;

	ret = adreno_gpu_init(dev, pdev, adreno_gpu, &funcs);
	if (ret) {
		a5xx_destroy(&(a5xx_gpu->base.base));
		return ERR_PTR(ret);
	}

	if (gpu->aspace)
		msm_mmu_set_fault_handler(gpu->aspace->mmu, gpu, a5xx_fault_handler);

	return gpu;
}