blob: 9cc4ba8d03d57f10350c44e22824b166ebd7f1d6 [file] [log] [blame]
Jerome Glisse3ce0a232009-09-08 10:10:24 +10001/*
2 * Copyright 2008 Advanced Micro Devices, Inc.
3 * Copyright 2008 Red Hat Inc.
4 * Copyright 2009 Jerome Glisse.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
23 *
24 * Authors: Dave Airlie
25 * Alex Deucher
26 * Jerome Glisse
27 */
28#include "drmP.h"
29#include "radeon.h"
Jerome Glisse3ce0a232009-09-08 10:10:24 +100030#include "r600d.h"
Jerome Glisse3ce0a232009-09-08 10:10:24 +100031
32static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
33 struct radeon_cs_reloc **cs_reloc);
34static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
35 struct radeon_cs_reloc **cs_reloc);
36typedef int (*next_reloc_t)(struct radeon_cs_parser*, struct radeon_cs_reloc**);
37static next_reloc_t r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_mm;
38
Jerome Glissec8c15ff2010-01-18 13:01:36 +010039struct r600_cs_track {
40 u32 cb_color0_base_last;
41};
42
Jerome Glisse3ce0a232009-09-08 10:10:24 +100043/**
44 * r600_cs_packet_parse() - parse cp packet and point ib index to next packet
45 * @parser: parser structure holding parsing context.
46 * @pkt: where to store packet informations
47 *
48 * Assume that chunk_ib_index is properly set. Will return -EINVAL
49 * if packet is bigger than remaining ib size. or if packets is unknown.
50 **/
51int r600_cs_packet_parse(struct radeon_cs_parser *p,
52 struct radeon_cs_packet *pkt,
53 unsigned idx)
54{
55 struct radeon_cs_chunk *ib_chunk = &p->chunks[p->chunk_ib_idx];
56 uint32_t header;
57
58 if (idx >= ib_chunk->length_dw) {
59 DRM_ERROR("Can not parse packet at %d after CS end %d !\n",
60 idx, ib_chunk->length_dw);
61 return -EINVAL;
62 }
Dave Airlie513bcb42009-09-23 16:56:27 +100063 header = radeon_get_ib_value(p, idx);
Jerome Glisse3ce0a232009-09-08 10:10:24 +100064 pkt->idx = idx;
65 pkt->type = CP_PACKET_GET_TYPE(header);
66 pkt->count = CP_PACKET_GET_COUNT(header);
67 pkt->one_reg_wr = 0;
68 switch (pkt->type) {
69 case PACKET_TYPE0:
70 pkt->reg = CP_PACKET0_GET_REG(header);
71 break;
72 case PACKET_TYPE3:
73 pkt->opcode = CP_PACKET3_GET_OPCODE(header);
74 break;
75 case PACKET_TYPE2:
76 pkt->count = -1;
77 break;
78 default:
79 DRM_ERROR("Unknown packet type %d at %d !\n", pkt->type, idx);
80 return -EINVAL;
81 }
82 if ((pkt->count + 1 + pkt->idx) >= ib_chunk->length_dw) {
83 DRM_ERROR("Packet (%d:%d:%d) end after CS buffer (%d) !\n",
84 pkt->idx, pkt->type, pkt->count, ib_chunk->length_dw);
85 return -EINVAL;
86 }
87 return 0;
88}
89
90/**
91 * r600_cs_packet_next_reloc_mm() - parse next packet which should be reloc packet3
92 * @parser: parser structure holding parsing context.
93 * @data: pointer to relocation data
94 * @offset_start: starting offset
95 * @offset_mask: offset mask (to align start offset on)
96 * @reloc: reloc informations
97 *
98 * Check next packet is relocation packet3, do bo validation and compute
99 * GPU offset using the provided start.
100 **/
101static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
102 struct radeon_cs_reloc **cs_reloc)
103{
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000104 struct radeon_cs_chunk *relocs_chunk;
105 struct radeon_cs_packet p3reloc;
106 unsigned idx;
107 int r;
108
109 if (p->chunk_relocs_idx == -1) {
110 DRM_ERROR("No relocation chunk !\n");
111 return -EINVAL;
112 }
113 *cs_reloc = NULL;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000114 relocs_chunk = &p->chunks[p->chunk_relocs_idx];
115 r = r600_cs_packet_parse(p, &p3reloc, p->idx);
116 if (r) {
117 return r;
118 }
119 p->idx += p3reloc.count + 2;
120 if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
121 DRM_ERROR("No packet3 for relocation for packet at %d.\n",
122 p3reloc.idx);
123 return -EINVAL;
124 }
Dave Airlie513bcb42009-09-23 16:56:27 +1000125 idx = radeon_get_ib_value(p, p3reloc.idx + 1);
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000126 if (idx >= relocs_chunk->length_dw) {
127 DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
128 idx, relocs_chunk->length_dw);
129 return -EINVAL;
130 }
131 /* FIXME: we assume reloc size is 4 dwords */
132 *cs_reloc = p->relocs_ptr[(idx / 4)];
133 return 0;
134}
135
136/**
137 * r600_cs_packet_next_reloc_nomm() - parse next packet which should be reloc packet3
138 * @parser: parser structure holding parsing context.
139 * @data: pointer to relocation data
140 * @offset_start: starting offset
141 * @offset_mask: offset mask (to align start offset on)
142 * @reloc: reloc informations
143 *
144 * Check next packet is relocation packet3, do bo validation and compute
145 * GPU offset using the provided start.
146 **/
147static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
148 struct radeon_cs_reloc **cs_reloc)
149{
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000150 struct radeon_cs_chunk *relocs_chunk;
151 struct radeon_cs_packet p3reloc;
152 unsigned idx;
153 int r;
154
155 if (p->chunk_relocs_idx == -1) {
156 DRM_ERROR("No relocation chunk !\n");
157 return -EINVAL;
158 }
159 *cs_reloc = NULL;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000160 relocs_chunk = &p->chunks[p->chunk_relocs_idx];
161 r = r600_cs_packet_parse(p, &p3reloc, p->idx);
162 if (r) {
163 return r;
164 }
165 p->idx += p3reloc.count + 2;
166 if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
167 DRM_ERROR("No packet3 for relocation for packet at %d.\n",
168 p3reloc.idx);
169 return -EINVAL;
170 }
Dave Airlie513bcb42009-09-23 16:56:27 +1000171 idx = radeon_get_ib_value(p, p3reloc.idx + 1);
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000172 if (idx >= relocs_chunk->length_dw) {
173 DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
174 idx, relocs_chunk->length_dw);
175 return -EINVAL;
176 }
Julia Lawalle265f39e2009-12-19 08:16:33 +0100177 *cs_reloc = p->relocs;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000178 (*cs_reloc)->lobj.gpu_offset = (u64)relocs_chunk->kdata[idx + 3] << 32;
179 (*cs_reloc)->lobj.gpu_offset |= relocs_chunk->kdata[idx + 0];
180 return 0;
181}
182
Alex Deucher2f67c6e2009-09-25 16:35:11 -0400183/**
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100184 * r600_cs_packet_next_is_pkt3_nop() - test if next packet is packet3 nop for reloc
185 * @parser: parser structure holding parsing context.
186 *
187 * Check next packet is relocation packet3, do bo validation and compute
188 * GPU offset using the provided start.
189 **/
190static inline int r600_cs_packet_next_is_pkt3_nop(struct radeon_cs_parser *p)
191{
192 struct radeon_cs_packet p3reloc;
193 int r;
194
195 r = r600_cs_packet_parse(p, &p3reloc, p->idx);
196 if (r) {
197 return 0;
198 }
199 if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
200 return 0;
201 }
202 return 1;
203}
204
205/**
Alex Deucher2f67c6e2009-09-25 16:35:11 -0400206 * r600_cs_packet_next_vline() - parse userspace VLINE packet
207 * @parser: parser structure holding parsing context.
208 *
209 * Userspace sends a special sequence for VLINE waits.
210 * PACKET0 - VLINE_START_END + value
211 * PACKET3 - WAIT_REG_MEM poll vline status reg
212 * RELOC (P3) - crtc_id in reloc.
213 *
214 * This function parses this and relocates the VLINE START END
215 * and WAIT_REG_MEM packets to the correct crtc.
216 * It also detects a switched off crtc and nulls out the
217 * wait in that case.
218 */
219static int r600_cs_packet_parse_vline(struct radeon_cs_parser *p)
220{
221 struct drm_mode_object *obj;
222 struct drm_crtc *crtc;
223 struct radeon_crtc *radeon_crtc;
224 struct radeon_cs_packet p3reloc, wait_reg_mem;
225 int crtc_id;
226 int r;
227 uint32_t header, h_idx, reg, wait_reg_mem_info;
228 volatile uint32_t *ib;
229
230 ib = p->ib->ptr;
231
232 /* parse the WAIT_REG_MEM */
233 r = r600_cs_packet_parse(p, &wait_reg_mem, p->idx);
234 if (r)
235 return r;
236
237 /* check its a WAIT_REG_MEM */
238 if (wait_reg_mem.type != PACKET_TYPE3 ||
239 wait_reg_mem.opcode != PACKET3_WAIT_REG_MEM) {
240 DRM_ERROR("vline wait missing WAIT_REG_MEM segment\n");
241 r = -EINVAL;
242 return r;
243 }
244
245 wait_reg_mem_info = radeon_get_ib_value(p, wait_reg_mem.idx + 1);
246 /* bit 4 is reg (0) or mem (1) */
247 if (wait_reg_mem_info & 0x10) {
248 DRM_ERROR("vline WAIT_REG_MEM waiting on MEM rather than REG\n");
249 r = -EINVAL;
250 return r;
251 }
252 /* waiting for value to be equal */
253 if ((wait_reg_mem_info & 0x7) != 0x3) {
254 DRM_ERROR("vline WAIT_REG_MEM function not equal\n");
255 r = -EINVAL;
256 return r;
257 }
258 if ((radeon_get_ib_value(p, wait_reg_mem.idx + 2) << 2) != AVIVO_D1MODE_VLINE_STATUS) {
259 DRM_ERROR("vline WAIT_REG_MEM bad reg\n");
260 r = -EINVAL;
261 return r;
262 }
263
264 if (radeon_get_ib_value(p, wait_reg_mem.idx + 5) != AVIVO_D1MODE_VLINE_STAT) {
265 DRM_ERROR("vline WAIT_REG_MEM bad bit mask\n");
266 r = -EINVAL;
267 return r;
268 }
269
270 /* jump over the NOP */
271 r = r600_cs_packet_parse(p, &p3reloc, p->idx + wait_reg_mem.count + 2);
272 if (r)
273 return r;
274
275 h_idx = p->idx - 2;
276 p->idx += wait_reg_mem.count + 2;
277 p->idx += p3reloc.count + 2;
278
279 header = radeon_get_ib_value(p, h_idx);
280 crtc_id = radeon_get_ib_value(p, h_idx + 2 + 7 + 1);
Dave Airlied4ac6a02009-10-08 11:32:49 +1000281 reg = CP_PACKET0_GET_REG(header);
Alex Deucher2f67c6e2009-09-25 16:35:11 -0400282 mutex_lock(&p->rdev->ddev->mode_config.mutex);
283 obj = drm_mode_object_find(p->rdev->ddev, crtc_id, DRM_MODE_OBJECT_CRTC);
284 if (!obj) {
285 DRM_ERROR("cannot find crtc %d\n", crtc_id);
286 r = -EINVAL;
287 goto out;
288 }
289 crtc = obj_to_crtc(obj);
290 radeon_crtc = to_radeon_crtc(crtc);
291 crtc_id = radeon_crtc->crtc_id;
292
293 if (!crtc->enabled) {
294 /* if the CRTC isn't enabled - we need to nop out the WAIT_REG_MEM */
295 ib[h_idx + 2] = PACKET2(0);
296 ib[h_idx + 3] = PACKET2(0);
297 ib[h_idx + 4] = PACKET2(0);
298 ib[h_idx + 5] = PACKET2(0);
299 ib[h_idx + 6] = PACKET2(0);
300 ib[h_idx + 7] = PACKET2(0);
301 ib[h_idx + 8] = PACKET2(0);
302 } else if (crtc_id == 1) {
303 switch (reg) {
304 case AVIVO_D1MODE_VLINE_START_END:
305 header &= ~R600_CP_PACKET0_REG_MASK;
306 header |= AVIVO_D2MODE_VLINE_START_END >> 2;
307 break;
308 default:
309 DRM_ERROR("unknown crtc reloc\n");
310 r = -EINVAL;
311 goto out;
312 }
313 ib[h_idx] = header;
314 ib[h_idx + 4] = AVIVO_D2MODE_VLINE_STATUS >> 2;
315 }
316out:
317 mutex_unlock(&p->rdev->ddev->mode_config.mutex);
318 return r;
319}
320
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000321static int r600_packet0_check(struct radeon_cs_parser *p,
322 struct radeon_cs_packet *pkt,
323 unsigned idx, unsigned reg)
324{
Alex Deucher2f67c6e2009-09-25 16:35:11 -0400325 int r;
326
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000327 switch (reg) {
328 case AVIVO_D1MODE_VLINE_START_END:
Alex Deucher2f67c6e2009-09-25 16:35:11 -0400329 r = r600_cs_packet_parse_vline(p);
330 if (r) {
331 DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
332 idx, reg);
333 return r;
334 }
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000335 break;
336 default:
337 printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n",
338 reg, idx);
339 return -EINVAL;
340 }
341 return 0;
342}
343
344static int r600_cs_parse_packet0(struct radeon_cs_parser *p,
345 struct radeon_cs_packet *pkt)
346{
347 unsigned reg, i;
348 unsigned idx;
349 int r;
350
351 idx = pkt->idx + 1;
352 reg = pkt->reg;
353 for (i = 0; i <= pkt->count; i++, idx++, reg += 4) {
354 r = r600_packet0_check(p, pkt, idx, reg);
355 if (r) {
356 return r;
357 }
358 }
359 return 0;
360}
361
362static int r600_packet3_check(struct radeon_cs_parser *p,
363 struct radeon_cs_packet *pkt)
364{
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000365 struct radeon_cs_reloc *reloc;
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100366 struct r600_cs_track *track;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000367 volatile u32 *ib;
368 unsigned idx;
369 unsigned i;
370 unsigned start_reg, end_reg, reg;
371 int r;
Dave Airlieadea4792009-09-25 14:23:47 +1000372 u32 idx_value;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000373
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100374 track = (struct r600_cs_track *)p->track;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000375 ib = p->ib->ptr;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000376 idx = pkt->idx + 1;
Dave Airlieadea4792009-09-25 14:23:47 +1000377 idx_value = radeon_get_ib_value(p, idx);
Dave Airlie513bcb42009-09-23 16:56:27 +1000378
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000379 switch (pkt->opcode) {
380 case PACKET3_START_3D_CMDBUF:
381 if (p->family >= CHIP_RV770 || pkt->count) {
382 DRM_ERROR("bad START_3D\n");
383 return -EINVAL;
384 }
385 break;
386 case PACKET3_CONTEXT_CONTROL:
387 if (pkt->count != 1) {
388 DRM_ERROR("bad CONTEXT_CONTROL\n");
389 return -EINVAL;
390 }
391 break;
392 case PACKET3_INDEX_TYPE:
393 case PACKET3_NUM_INSTANCES:
394 if (pkt->count) {
395 DRM_ERROR("bad INDEX_TYPE/NUM_INSTANCES\n");
396 return -EINVAL;
397 }
398 break;
399 case PACKET3_DRAW_INDEX:
400 if (pkt->count != 3) {
401 DRM_ERROR("bad DRAW_INDEX\n");
402 return -EINVAL;
403 }
404 r = r600_cs_packet_next_reloc(p, &reloc);
405 if (r) {
406 DRM_ERROR("bad DRAW_INDEX\n");
407 return -EINVAL;
408 }
Dave Airlieadea4792009-09-25 14:23:47 +1000409 ib[idx+0] = idx_value + (u32)(reloc->lobj.gpu_offset & 0xffffffff);
Alex Deucher210bed82009-09-25 18:33:08 -0400410 ib[idx+1] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000411 break;
412 case PACKET3_DRAW_INDEX_AUTO:
413 if (pkt->count != 1) {
414 DRM_ERROR("bad DRAW_INDEX_AUTO\n");
415 return -EINVAL;
416 }
417 break;
418 case PACKET3_DRAW_INDEX_IMMD_BE:
419 case PACKET3_DRAW_INDEX_IMMD:
420 if (pkt->count < 2) {
421 DRM_ERROR("bad DRAW_INDEX_IMMD\n");
422 return -EINVAL;
423 }
424 break;
425 case PACKET3_WAIT_REG_MEM:
426 if (pkt->count != 5) {
427 DRM_ERROR("bad WAIT_REG_MEM\n");
428 return -EINVAL;
429 }
430 /* bit 4 is reg (0) or mem (1) */
Dave Airlieadea4792009-09-25 14:23:47 +1000431 if (idx_value & 0x10) {
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000432 r = r600_cs_packet_next_reloc(p, &reloc);
433 if (r) {
434 DRM_ERROR("bad WAIT_REG_MEM\n");
435 return -EINVAL;
436 }
437 ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
Alex Deucher210bed82009-09-25 18:33:08 -0400438 ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000439 }
440 break;
441 case PACKET3_SURFACE_SYNC:
442 if (pkt->count != 3) {
443 DRM_ERROR("bad SURFACE_SYNC\n");
444 return -EINVAL;
445 }
446 /* 0xffffffff/0x0 is flush all cache flag */
Dave Airlie513bcb42009-09-23 16:56:27 +1000447 if (radeon_get_ib_value(p, idx + 1) != 0xffffffff ||
448 radeon_get_ib_value(p, idx + 2) != 0) {
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000449 r = r600_cs_packet_next_reloc(p, &reloc);
450 if (r) {
451 DRM_ERROR("bad SURFACE_SYNC\n");
452 return -EINVAL;
453 }
454 ib[idx+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
455 }
456 break;
457 case PACKET3_EVENT_WRITE:
458 if (pkt->count != 2 && pkt->count != 0) {
459 DRM_ERROR("bad EVENT_WRITE\n");
460 return -EINVAL;
461 }
462 if (pkt->count) {
463 r = r600_cs_packet_next_reloc(p, &reloc);
464 if (r) {
465 DRM_ERROR("bad EVENT_WRITE\n");
466 return -EINVAL;
467 }
468 ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
Alex Deucher210bed82009-09-25 18:33:08 -0400469 ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000470 }
471 break;
472 case PACKET3_EVENT_WRITE_EOP:
473 if (pkt->count != 4) {
474 DRM_ERROR("bad EVENT_WRITE_EOP\n");
475 return -EINVAL;
476 }
477 r = r600_cs_packet_next_reloc(p, &reloc);
478 if (r) {
479 DRM_ERROR("bad EVENT_WRITE\n");
480 return -EINVAL;
481 }
482 ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
Alex Deucher210bed82009-09-25 18:33:08 -0400483 ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000484 break;
485 case PACKET3_SET_CONFIG_REG:
Dave Airlieadea4792009-09-25 14:23:47 +1000486 start_reg = (idx_value << 2) + PACKET3_SET_CONFIG_REG_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000487 end_reg = 4 * pkt->count + start_reg - 4;
488 if ((start_reg < PACKET3_SET_CONFIG_REG_OFFSET) ||
489 (start_reg >= PACKET3_SET_CONFIG_REG_END) ||
490 (end_reg >= PACKET3_SET_CONFIG_REG_END)) {
491 DRM_ERROR("bad PACKET3_SET_CONFIG_REG\n");
492 return -EINVAL;
493 }
494 for (i = 0; i < pkt->count; i++) {
495 reg = start_reg + (4 * i);
496 switch (reg) {
Alex Deuchera39533b2009-11-09 16:41:21 -0500497 case SQ_ESGS_RING_BASE:
498 case SQ_GSVS_RING_BASE:
499 case SQ_ESTMP_RING_BASE:
500 case SQ_GSTMP_RING_BASE:
501 case SQ_VSTMP_RING_BASE:
502 case SQ_PSTMP_RING_BASE:
503 case SQ_FBUF_RING_BASE:
504 case SQ_REDUC_RING_BASE:
505 case SX_MEMORY_EXPORT_BASE:
506 r = r600_cs_packet_next_reloc(p, &reloc);
507 if (r) {
508 DRM_ERROR("bad SET_CONFIG_REG "
509 "0x%04X\n", reg);
510 return -EINVAL;
511 }
512 ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
513 break;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000514 case CP_COHER_BASE:
515 /* use PACKET3_SURFACE_SYNC */
516 return -EINVAL;
517 default:
518 break;
519 }
520 }
521 break;
522 case PACKET3_SET_CONTEXT_REG:
Dave Airlieadea4792009-09-25 14:23:47 +1000523 start_reg = (idx_value << 2) + PACKET3_SET_CONTEXT_REG_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000524 end_reg = 4 * pkt->count + start_reg - 4;
525 if ((start_reg < PACKET3_SET_CONTEXT_REG_OFFSET) ||
526 (start_reg >= PACKET3_SET_CONTEXT_REG_END) ||
527 (end_reg >= PACKET3_SET_CONTEXT_REG_END)) {
528 DRM_ERROR("bad PACKET3_SET_CONTEXT_REG\n");
529 return -EINVAL;
530 }
531 for (i = 0; i < pkt->count; i++) {
532 reg = start_reg + (4 * i);
533 switch (reg) {
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100534 /* This register were added late, there is userspace
535 * which does provide relocation for those but set
536 * 0 offset. In order to avoid breaking old userspace
537 * we detect this and set address to point to last
538 * CB_COLOR0_BASE, note that if userspace doesn't set
539 * CB_COLOR0_BASE before this register we will report
540 * error. Old userspace always set CB_COLOR0_BASE
541 * before any of this.
542 */
543 case R_0280E0_CB_COLOR0_FRAG:
544 case R_0280E4_CB_COLOR1_FRAG:
545 case R_0280E8_CB_COLOR2_FRAG:
546 case R_0280EC_CB_COLOR3_FRAG:
547 case R_0280F0_CB_COLOR4_FRAG:
548 case R_0280F4_CB_COLOR5_FRAG:
549 case R_0280F8_CB_COLOR6_FRAG:
550 case R_0280FC_CB_COLOR7_FRAG:
551 case R_0280C0_CB_COLOR0_TILE:
552 case R_0280C4_CB_COLOR1_TILE:
553 case R_0280C8_CB_COLOR2_TILE:
554 case R_0280CC_CB_COLOR3_TILE:
555 case R_0280D0_CB_COLOR4_TILE:
556 case R_0280D4_CB_COLOR5_TILE:
557 case R_0280D8_CB_COLOR6_TILE:
558 case R_0280DC_CB_COLOR7_TILE:
559 if (!r600_cs_packet_next_is_pkt3_nop(p)) {
560 if (!track->cb_color0_base_last) {
561 dev_err(p->dev, "Broken old userspace ? no cb_color0_base supplied before trying to write 0x%08X\n", reg);
562 return -EINVAL;
563 }
564 ib[idx+1+i] = track->cb_color0_base_last;
565 printk_once(KERN_WARNING "You have old & broken userspace "
566 "please consider updating mesa & xf86-video-ati\n");
567 } else {
568 r = r600_cs_packet_next_reloc(p, &reloc);
569 if (r) {
570 dev_err(p->dev, "bad SET_CONTEXT_REG 0x%04X\n", reg);
571 return -EINVAL;
572 }
573 ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
574 }
575 break;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000576 case DB_DEPTH_BASE:
Alex Deuchera39533b2009-11-09 16:41:21 -0500577 case DB_HTILE_DATA_BASE:
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000578 case CB_COLOR0_BASE:
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100579 r = r600_cs_packet_next_reloc(p, &reloc);
580 if (r) {
581 DRM_ERROR("bad SET_CONTEXT_REG "
582 "0x%04X\n", reg);
583 return -EINVAL;
584 }
585 ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
586 track->cb_color0_base_last = ib[idx+1+i];
587 break;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000588 case CB_COLOR1_BASE:
589 case CB_COLOR2_BASE:
590 case CB_COLOR3_BASE:
591 case CB_COLOR4_BASE:
592 case CB_COLOR5_BASE:
593 case CB_COLOR6_BASE:
594 case CB_COLOR7_BASE:
595 case SQ_PGM_START_FS:
596 case SQ_PGM_START_ES:
597 case SQ_PGM_START_VS:
598 case SQ_PGM_START_GS:
599 case SQ_PGM_START_PS:
600 r = r600_cs_packet_next_reloc(p, &reloc);
601 if (r) {
602 DRM_ERROR("bad SET_CONTEXT_REG "
603 "0x%04X\n", reg);
604 return -EINVAL;
605 }
606 ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
607 break;
608 case VGT_DMA_BASE:
609 case VGT_DMA_BASE_HI:
610 /* These should be handled by DRAW_INDEX packet 3 */
611 case VGT_STRMOUT_BASE_OFFSET_0:
612 case VGT_STRMOUT_BASE_OFFSET_1:
613 case VGT_STRMOUT_BASE_OFFSET_2:
614 case VGT_STRMOUT_BASE_OFFSET_3:
615 case VGT_STRMOUT_BASE_OFFSET_HI_0:
616 case VGT_STRMOUT_BASE_OFFSET_HI_1:
617 case VGT_STRMOUT_BASE_OFFSET_HI_2:
618 case VGT_STRMOUT_BASE_OFFSET_HI_3:
619 case VGT_STRMOUT_BUFFER_BASE_0:
620 case VGT_STRMOUT_BUFFER_BASE_1:
621 case VGT_STRMOUT_BUFFER_BASE_2:
622 case VGT_STRMOUT_BUFFER_BASE_3:
623 case VGT_STRMOUT_BUFFER_OFFSET_0:
624 case VGT_STRMOUT_BUFFER_OFFSET_1:
625 case VGT_STRMOUT_BUFFER_OFFSET_2:
626 case VGT_STRMOUT_BUFFER_OFFSET_3:
627 /* These should be handled by STRMOUT_BUFFER packet 3 */
628 DRM_ERROR("bad context reg: 0x%08x\n", reg);
629 return -EINVAL;
630 default:
631 break;
632 }
633 }
634 break;
635 case PACKET3_SET_RESOURCE:
636 if (pkt->count % 7) {
637 DRM_ERROR("bad SET_RESOURCE\n");
638 return -EINVAL;
639 }
Dave Airlieadea4792009-09-25 14:23:47 +1000640 start_reg = (idx_value << 2) + PACKET3_SET_RESOURCE_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000641 end_reg = 4 * pkt->count + start_reg - 4;
642 if ((start_reg < PACKET3_SET_RESOURCE_OFFSET) ||
643 (start_reg >= PACKET3_SET_RESOURCE_END) ||
644 (end_reg >= PACKET3_SET_RESOURCE_END)) {
645 DRM_ERROR("bad SET_RESOURCE\n");
646 return -EINVAL;
647 }
648 for (i = 0; i < (pkt->count / 7); i++) {
Dave Airlieadea4792009-09-25 14:23:47 +1000649 switch (G__SQ_VTX_CONSTANT_TYPE(radeon_get_ib_value(p, idx+(i*7)+6+1))) {
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000650 case SQ_TEX_VTX_VALID_TEXTURE:
651 /* tex base */
652 r = r600_cs_packet_next_reloc(p, &reloc);
653 if (r) {
654 DRM_ERROR("bad SET_RESOURCE\n");
655 return -EINVAL;
656 }
657 ib[idx+1+(i*7)+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
658 /* tex mip base */
659 r = r600_cs_packet_next_reloc(p, &reloc);
660 if (r) {
661 DRM_ERROR("bad SET_RESOURCE\n");
662 return -EINVAL;
663 }
664 ib[idx+1+(i*7)+3] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
665 break;
666 case SQ_TEX_VTX_VALID_BUFFER:
667 /* vtx base */
668 r = r600_cs_packet_next_reloc(p, &reloc);
669 if (r) {
670 DRM_ERROR("bad SET_RESOURCE\n");
671 return -EINVAL;
672 }
673 ib[idx+1+(i*7)+0] += (u32)((reloc->lobj.gpu_offset) & 0xffffffff);
Alex Deucher210bed82009-09-25 18:33:08 -0400674 ib[idx+1+(i*7)+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000675 break;
676 case SQ_TEX_VTX_INVALID_TEXTURE:
677 case SQ_TEX_VTX_INVALID_BUFFER:
678 default:
679 DRM_ERROR("bad SET_RESOURCE\n");
680 return -EINVAL;
681 }
682 }
683 break;
684 case PACKET3_SET_ALU_CONST:
Dave Airlieadea4792009-09-25 14:23:47 +1000685 start_reg = (idx_value << 2) + PACKET3_SET_ALU_CONST_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000686 end_reg = 4 * pkt->count + start_reg - 4;
687 if ((start_reg < PACKET3_SET_ALU_CONST_OFFSET) ||
688 (start_reg >= PACKET3_SET_ALU_CONST_END) ||
689 (end_reg >= PACKET3_SET_ALU_CONST_END)) {
690 DRM_ERROR("bad SET_ALU_CONST\n");
691 return -EINVAL;
692 }
693 break;
694 case PACKET3_SET_BOOL_CONST:
Dave Airlieadea4792009-09-25 14:23:47 +1000695 start_reg = (idx_value << 2) + PACKET3_SET_BOOL_CONST_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000696 end_reg = 4 * pkt->count + start_reg - 4;
697 if ((start_reg < PACKET3_SET_BOOL_CONST_OFFSET) ||
698 (start_reg >= PACKET3_SET_BOOL_CONST_END) ||
699 (end_reg >= PACKET3_SET_BOOL_CONST_END)) {
700 DRM_ERROR("bad SET_BOOL_CONST\n");
701 return -EINVAL;
702 }
703 break;
704 case PACKET3_SET_LOOP_CONST:
Dave Airlieadea4792009-09-25 14:23:47 +1000705 start_reg = (idx_value << 2) + PACKET3_SET_LOOP_CONST_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000706 end_reg = 4 * pkt->count + start_reg - 4;
707 if ((start_reg < PACKET3_SET_LOOP_CONST_OFFSET) ||
708 (start_reg >= PACKET3_SET_LOOP_CONST_END) ||
709 (end_reg >= PACKET3_SET_LOOP_CONST_END)) {
710 DRM_ERROR("bad SET_LOOP_CONST\n");
711 return -EINVAL;
712 }
713 break;
714 case PACKET3_SET_CTL_CONST:
Dave Airlieadea4792009-09-25 14:23:47 +1000715 start_reg = (idx_value << 2) + PACKET3_SET_CTL_CONST_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000716 end_reg = 4 * pkt->count + start_reg - 4;
717 if ((start_reg < PACKET3_SET_CTL_CONST_OFFSET) ||
718 (start_reg >= PACKET3_SET_CTL_CONST_END) ||
719 (end_reg >= PACKET3_SET_CTL_CONST_END)) {
720 DRM_ERROR("bad SET_CTL_CONST\n");
721 return -EINVAL;
722 }
723 break;
724 case PACKET3_SET_SAMPLER:
725 if (pkt->count % 3) {
726 DRM_ERROR("bad SET_SAMPLER\n");
727 return -EINVAL;
728 }
Dave Airlieadea4792009-09-25 14:23:47 +1000729 start_reg = (idx_value << 2) + PACKET3_SET_SAMPLER_OFFSET;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000730 end_reg = 4 * pkt->count + start_reg - 4;
731 if ((start_reg < PACKET3_SET_SAMPLER_OFFSET) ||
732 (start_reg >= PACKET3_SET_SAMPLER_END) ||
733 (end_reg >= PACKET3_SET_SAMPLER_END)) {
734 DRM_ERROR("bad SET_SAMPLER\n");
735 return -EINVAL;
736 }
737 break;
738 case PACKET3_SURFACE_BASE_UPDATE:
739 if (p->family >= CHIP_RV770 || p->family == CHIP_R600) {
740 DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
741 return -EINVAL;
742 }
743 if (pkt->count) {
744 DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
745 return -EINVAL;
746 }
747 break;
748 case PACKET3_NOP:
749 break;
750 default:
751 DRM_ERROR("Packet3 opcode %x not supported\n", pkt->opcode);
752 return -EINVAL;
753 }
754 return 0;
755}
756
757int r600_cs_parse(struct radeon_cs_parser *p)
758{
759 struct radeon_cs_packet pkt;
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100760 struct r600_cs_track *track;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000761 int r;
762
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100763 track = kzalloc(sizeof(*track), GFP_KERNEL);
764 p->track = track;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000765 do {
766 r = r600_cs_packet_parse(p, &pkt, p->idx);
767 if (r) {
768 return r;
769 }
770 p->idx += pkt.count + 2;
771 switch (pkt.type) {
772 case PACKET_TYPE0:
773 r = r600_cs_parse_packet0(p, &pkt);
774 break;
775 case PACKET_TYPE2:
776 break;
777 case PACKET_TYPE3:
778 r = r600_packet3_check(p, &pkt);
779 break;
780 default:
781 DRM_ERROR("Unknown packet type %d !\n", pkt.type);
782 return -EINVAL;
783 }
784 if (r) {
785 return r;
786 }
787 } while (p->idx < p->chunks[p->chunk_ib_idx].length_dw);
788#if 0
789 for (r = 0; r < p->ib->length_dw; r++) {
790 printk(KERN_INFO "%05d 0x%08X\n", r, p->ib->ptr[r]);
791 mdelay(1);
792 }
793#endif
794 return 0;
795}
796
797static int r600_cs_parser_relocs_legacy(struct radeon_cs_parser *p)
798{
799 if (p->chunk_relocs_idx == -1) {
800 return 0;
801 }
Julia Lawalle265f39e2009-12-19 08:16:33 +0100802 p->relocs = kzalloc(sizeof(struct radeon_cs_reloc), GFP_KERNEL);
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000803 if (p->relocs == NULL) {
804 return -ENOMEM;
805 }
806 return 0;
807}
808
809/**
810 * cs_parser_fini() - clean parser states
811 * @parser: parser structure holding parsing context.
812 * @error: error number
813 *
814 * If error is set than unvalidate buffer, otherwise just free memory
815 * used by parsing context.
816 **/
817static void r600_cs_parser_fini(struct radeon_cs_parser *parser, int error)
818{
819 unsigned i;
820
821 kfree(parser->relocs);
822 for (i = 0; i < parser->nchunks; i++) {
823 kfree(parser->chunks[i].kdata);
Dave Airlie4c57edba2009-09-28 15:37:25 +1000824 kfree(parser->chunks[i].kpage[0]);
825 kfree(parser->chunks[i].kpage[1]);
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000826 }
827 kfree(parser->chunks);
828 kfree(parser->chunks_array);
829}
830
831int r600_cs_legacy(struct drm_device *dev, void *data, struct drm_file *filp,
832 unsigned family, u32 *ib, int *l)
833{
834 struct radeon_cs_parser parser;
835 struct radeon_cs_chunk *ib_chunk;
836 struct radeon_ib fake_ib;
837 int r;
838
839 /* initialize parser */
840 memset(&parser, 0, sizeof(struct radeon_cs_parser));
841 parser.filp = filp;
Jerome Glissec8c15ff2010-01-18 13:01:36 +0100842 parser.dev = &dev->pdev->dev;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000843 parser.rdev = NULL;
844 parser.family = family;
845 parser.ib = &fake_ib;
846 fake_ib.ptr = ib;
847 r = radeon_cs_parser_init(&parser, data);
848 if (r) {
849 DRM_ERROR("Failed to initialize parser !\n");
850 r600_cs_parser_fini(&parser, r);
851 return r;
852 }
853 r = r600_cs_parser_relocs_legacy(&parser);
854 if (r) {
855 DRM_ERROR("Failed to parse relocation !\n");
856 r600_cs_parser_fini(&parser, r);
857 return r;
858 }
859 /* Copy the packet into the IB, the parser will read from the
860 * input memory (cached) and write to the IB (which can be
861 * uncached). */
862 ib_chunk = &parser.chunks[parser.chunk_ib_idx];
863 parser.ib->length_dw = ib_chunk->length_dw;
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000864 *l = parser.ib->length_dw;
865 r = r600_cs_parse(&parser);
866 if (r) {
867 DRM_ERROR("Invalid command stream !\n");
868 r600_cs_parser_fini(&parser, r);
869 return r;
870 }
Dave Airlie513bcb42009-09-23 16:56:27 +1000871 r = radeon_cs_finish_pages(&parser);
872 if (r) {
873 DRM_ERROR("Invalid command stream !\n");
874 r600_cs_parser_fini(&parser, r);
875 return r;
876 }
Jerome Glisse3ce0a232009-09-08 10:10:24 +1000877 r600_cs_parser_fini(&parser, r);
878 return r;
879}
880
881void r600_cs_legacy_init(void)
882{
883 r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_nomm;
884}