xref: /openbmc/linux/drivers/gpu/drm/radeon/r600_cs.c (revision b6dcefde)
1 /*
2  * Copyright 2008 Advanced Micro Devices, Inc.
3  * Copyright 2008 Red Hat Inc.
4  * Copyright 2009 Jerome Glisse.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22  * OTHER DEALINGS IN THE SOFTWARE.
23  *
24  * Authors: Dave Airlie
25  *          Alex Deucher
26  *          Jerome Glisse
27  */
28 #include "drmP.h"
29 #include "radeon.h"
30 #include "r600d.h"
31 
32 static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
33 					struct radeon_cs_reloc **cs_reloc);
34 static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
35 					struct radeon_cs_reloc **cs_reloc);
36 typedef int (*next_reloc_t)(struct radeon_cs_parser*, struct radeon_cs_reloc**);
37 static next_reloc_t r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_mm;
38 
39 struct r600_cs_track {
40 	u32	cb_color0_base_last;
41 };
42 
43 /**
44  * r600_cs_packet_parse() - parse cp packet and point ib index to next packet
45  * @parser:	parser structure holding parsing context.
46  * @pkt:	where to store packet informations
47  *
48  * Assume that chunk_ib_index is properly set. Will return -EINVAL
49  * if packet is bigger than remaining ib size. or if packets is unknown.
50  **/
51 int r600_cs_packet_parse(struct radeon_cs_parser *p,
52 			struct radeon_cs_packet *pkt,
53 			unsigned idx)
54 {
55 	struct radeon_cs_chunk *ib_chunk = &p->chunks[p->chunk_ib_idx];
56 	uint32_t header;
57 
58 	if (idx >= ib_chunk->length_dw) {
59 		DRM_ERROR("Can not parse packet at %d after CS end %d !\n",
60 			  idx, ib_chunk->length_dw);
61 		return -EINVAL;
62 	}
63 	header = radeon_get_ib_value(p, idx);
64 	pkt->idx = idx;
65 	pkt->type = CP_PACKET_GET_TYPE(header);
66 	pkt->count = CP_PACKET_GET_COUNT(header);
67 	pkt->one_reg_wr = 0;
68 	switch (pkt->type) {
69 	case PACKET_TYPE0:
70 		pkt->reg = CP_PACKET0_GET_REG(header);
71 		break;
72 	case PACKET_TYPE3:
73 		pkt->opcode = CP_PACKET3_GET_OPCODE(header);
74 		break;
75 	case PACKET_TYPE2:
76 		pkt->count = -1;
77 		break;
78 	default:
79 		DRM_ERROR("Unknown packet type %d at %d !\n", pkt->type, idx);
80 		return -EINVAL;
81 	}
82 	if ((pkt->count + 1 + pkt->idx) >= ib_chunk->length_dw) {
83 		DRM_ERROR("Packet (%d:%d:%d) end after CS buffer (%d) !\n",
84 			  pkt->idx, pkt->type, pkt->count, ib_chunk->length_dw);
85 		return -EINVAL;
86 	}
87 	return 0;
88 }
89 
90 /**
91  * r600_cs_packet_next_reloc_mm() - parse next packet which should be reloc packet3
92  * @parser:		parser structure holding parsing context.
93  * @data:		pointer to relocation data
94  * @offset_start:	starting offset
95  * @offset_mask:	offset mask (to align start offset on)
96  * @reloc:		reloc informations
97  *
98  * Check next packet is relocation packet3, do bo validation and compute
99  * GPU offset using the provided start.
100  **/
101 static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
102 					struct radeon_cs_reloc **cs_reloc)
103 {
104 	struct radeon_cs_chunk *relocs_chunk;
105 	struct radeon_cs_packet p3reloc;
106 	unsigned idx;
107 	int r;
108 
109 	if (p->chunk_relocs_idx == -1) {
110 		DRM_ERROR("No relocation chunk !\n");
111 		return -EINVAL;
112 	}
113 	*cs_reloc = NULL;
114 	relocs_chunk = &p->chunks[p->chunk_relocs_idx];
115 	r = r600_cs_packet_parse(p, &p3reloc, p->idx);
116 	if (r) {
117 		return r;
118 	}
119 	p->idx += p3reloc.count + 2;
120 	if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
121 		DRM_ERROR("No packet3 for relocation for packet at %d.\n",
122 			  p3reloc.idx);
123 		return -EINVAL;
124 	}
125 	idx = radeon_get_ib_value(p, p3reloc.idx + 1);
126 	if (idx >= relocs_chunk->length_dw) {
127 		DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
128 			  idx, relocs_chunk->length_dw);
129 		return -EINVAL;
130 	}
131 	/* FIXME: we assume reloc size is 4 dwords */
132 	*cs_reloc = p->relocs_ptr[(idx / 4)];
133 	return 0;
134 }
135 
136 /**
137  * r600_cs_packet_next_reloc_nomm() - parse next packet which should be reloc packet3
138  * @parser:		parser structure holding parsing context.
139  * @data:		pointer to relocation data
140  * @offset_start:	starting offset
141  * @offset_mask:	offset mask (to align start offset on)
142  * @reloc:		reloc informations
143  *
144  * Check next packet is relocation packet3, do bo validation and compute
145  * GPU offset using the provided start.
146  **/
147 static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
148 					struct radeon_cs_reloc **cs_reloc)
149 {
150 	struct radeon_cs_chunk *relocs_chunk;
151 	struct radeon_cs_packet p3reloc;
152 	unsigned idx;
153 	int r;
154 
155 	if (p->chunk_relocs_idx == -1) {
156 		DRM_ERROR("No relocation chunk !\n");
157 		return -EINVAL;
158 	}
159 	*cs_reloc = NULL;
160 	relocs_chunk = &p->chunks[p->chunk_relocs_idx];
161 	r = r600_cs_packet_parse(p, &p3reloc, p->idx);
162 	if (r) {
163 		return r;
164 	}
165 	p->idx += p3reloc.count + 2;
166 	if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
167 		DRM_ERROR("No packet3 for relocation for packet at %d.\n",
168 			  p3reloc.idx);
169 		return -EINVAL;
170 	}
171 	idx = radeon_get_ib_value(p, p3reloc.idx + 1);
172 	if (idx >= relocs_chunk->length_dw) {
173 		DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
174 			  idx, relocs_chunk->length_dw);
175 		return -EINVAL;
176 	}
177 	*cs_reloc = p->relocs;
178 	(*cs_reloc)->lobj.gpu_offset = (u64)relocs_chunk->kdata[idx + 3] << 32;
179 	(*cs_reloc)->lobj.gpu_offset |= relocs_chunk->kdata[idx + 0];
180 	return 0;
181 }
182 
183 /**
184  * r600_cs_packet_next_is_pkt3_nop() - test if next packet is packet3 nop for reloc
185  * @parser:		parser structure holding parsing context.
186  *
187  * Check next packet is relocation packet3, do bo validation and compute
188  * GPU offset using the provided start.
189  **/
190 static inline int r600_cs_packet_next_is_pkt3_nop(struct radeon_cs_parser *p)
191 {
192 	struct radeon_cs_packet p3reloc;
193 	int r;
194 
195 	r = r600_cs_packet_parse(p, &p3reloc, p->idx);
196 	if (r) {
197 		return 0;
198 	}
199 	if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
200 		return 0;
201 	}
202 	return 1;
203 }
204 
205 /**
206  * r600_cs_packet_next_vline() - parse userspace VLINE packet
207  * @parser:		parser structure holding parsing context.
208  *
209  * Userspace sends a special sequence for VLINE waits.
210  * PACKET0 - VLINE_START_END + value
211  * PACKET3 - WAIT_REG_MEM poll vline status reg
212  * RELOC (P3) - crtc_id in reloc.
213  *
214  * This function parses this and relocates the VLINE START END
215  * and WAIT_REG_MEM packets to the correct crtc.
216  * It also detects a switched off crtc and nulls out the
217  * wait in that case.
218  */
219 static int r600_cs_packet_parse_vline(struct radeon_cs_parser *p)
220 {
221 	struct drm_mode_object *obj;
222 	struct drm_crtc *crtc;
223 	struct radeon_crtc *radeon_crtc;
224 	struct radeon_cs_packet p3reloc, wait_reg_mem;
225 	int crtc_id;
226 	int r;
227 	uint32_t header, h_idx, reg, wait_reg_mem_info;
228 	volatile uint32_t *ib;
229 
230 	ib = p->ib->ptr;
231 
232 	/* parse the WAIT_REG_MEM */
233 	r = r600_cs_packet_parse(p, &wait_reg_mem, p->idx);
234 	if (r)
235 		return r;
236 
237 	/* check its a WAIT_REG_MEM */
238 	if (wait_reg_mem.type != PACKET_TYPE3 ||
239 	    wait_reg_mem.opcode != PACKET3_WAIT_REG_MEM) {
240 		DRM_ERROR("vline wait missing WAIT_REG_MEM segment\n");
241 		r = -EINVAL;
242 		return r;
243 	}
244 
245 	wait_reg_mem_info = radeon_get_ib_value(p, wait_reg_mem.idx + 1);
246 	/* bit 4 is reg (0) or mem (1) */
247 	if (wait_reg_mem_info & 0x10) {
248 		DRM_ERROR("vline WAIT_REG_MEM waiting on MEM rather than REG\n");
249 		r = -EINVAL;
250 		return r;
251 	}
252 	/* waiting for value to be equal */
253 	if ((wait_reg_mem_info & 0x7) != 0x3) {
254 		DRM_ERROR("vline WAIT_REG_MEM function not equal\n");
255 		r = -EINVAL;
256 		return r;
257 	}
258 	if ((radeon_get_ib_value(p, wait_reg_mem.idx + 2) << 2) != AVIVO_D1MODE_VLINE_STATUS) {
259 		DRM_ERROR("vline WAIT_REG_MEM bad reg\n");
260 		r = -EINVAL;
261 		return r;
262 	}
263 
264 	if (radeon_get_ib_value(p, wait_reg_mem.idx + 5) != AVIVO_D1MODE_VLINE_STAT) {
265 		DRM_ERROR("vline WAIT_REG_MEM bad bit mask\n");
266 		r = -EINVAL;
267 		return r;
268 	}
269 
270 	/* jump over the NOP */
271 	r = r600_cs_packet_parse(p, &p3reloc, p->idx + wait_reg_mem.count + 2);
272 	if (r)
273 		return r;
274 
275 	h_idx = p->idx - 2;
276 	p->idx += wait_reg_mem.count + 2;
277 	p->idx += p3reloc.count + 2;
278 
279 	header = radeon_get_ib_value(p, h_idx);
280 	crtc_id = radeon_get_ib_value(p, h_idx + 2 + 7 + 1);
281 	reg = CP_PACKET0_GET_REG(header);
282 	mutex_lock(&p->rdev->ddev->mode_config.mutex);
283 	obj = drm_mode_object_find(p->rdev->ddev, crtc_id, DRM_MODE_OBJECT_CRTC);
284 	if (!obj) {
285 		DRM_ERROR("cannot find crtc %d\n", crtc_id);
286 		r = -EINVAL;
287 		goto out;
288 	}
289 	crtc = obj_to_crtc(obj);
290 	radeon_crtc = to_radeon_crtc(crtc);
291 	crtc_id = radeon_crtc->crtc_id;
292 
293 	if (!crtc->enabled) {
294 		/* if the CRTC isn't enabled - we need to nop out the WAIT_REG_MEM */
295 		ib[h_idx + 2] = PACKET2(0);
296 		ib[h_idx + 3] = PACKET2(0);
297 		ib[h_idx + 4] = PACKET2(0);
298 		ib[h_idx + 5] = PACKET2(0);
299 		ib[h_idx + 6] = PACKET2(0);
300 		ib[h_idx + 7] = PACKET2(0);
301 		ib[h_idx + 8] = PACKET2(0);
302 	} else if (crtc_id == 1) {
303 		switch (reg) {
304 		case AVIVO_D1MODE_VLINE_START_END:
305 			header &= ~R600_CP_PACKET0_REG_MASK;
306 			header |= AVIVO_D2MODE_VLINE_START_END >> 2;
307 			break;
308 		default:
309 			DRM_ERROR("unknown crtc reloc\n");
310 			r = -EINVAL;
311 			goto out;
312 		}
313 		ib[h_idx] = header;
314 		ib[h_idx + 4] = AVIVO_D2MODE_VLINE_STATUS >> 2;
315 	}
316 out:
317 	mutex_unlock(&p->rdev->ddev->mode_config.mutex);
318 	return r;
319 }
320 
321 static int r600_packet0_check(struct radeon_cs_parser *p,
322 				struct radeon_cs_packet *pkt,
323 				unsigned idx, unsigned reg)
324 {
325 	int r;
326 
327 	switch (reg) {
328 	case AVIVO_D1MODE_VLINE_START_END:
329 		r = r600_cs_packet_parse_vline(p);
330 		if (r) {
331 			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
332 					idx, reg);
333 			return r;
334 		}
335 		break;
336 	default:
337 		printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n",
338 		       reg, idx);
339 		return -EINVAL;
340 	}
341 	return 0;
342 }
343 
344 static int r600_cs_parse_packet0(struct radeon_cs_parser *p,
345 				struct radeon_cs_packet *pkt)
346 {
347 	unsigned reg, i;
348 	unsigned idx;
349 	int r;
350 
351 	idx = pkt->idx + 1;
352 	reg = pkt->reg;
353 	for (i = 0; i <= pkt->count; i++, idx++, reg += 4) {
354 		r = r600_packet0_check(p, pkt, idx, reg);
355 		if (r) {
356 			return r;
357 		}
358 	}
359 	return 0;
360 }
361 
362 static int r600_packet3_check(struct radeon_cs_parser *p,
363 				struct radeon_cs_packet *pkt)
364 {
365 	struct radeon_cs_reloc *reloc;
366 	struct r600_cs_track *track;
367 	volatile u32 *ib;
368 	unsigned idx;
369 	unsigned i;
370 	unsigned start_reg, end_reg, reg;
371 	int r;
372 	u32 idx_value;
373 
374 	track = (struct r600_cs_track *)p->track;
375 	ib = p->ib->ptr;
376 	idx = pkt->idx + 1;
377 	idx_value = radeon_get_ib_value(p, idx);
378 
379 	switch (pkt->opcode) {
380 	case PACKET3_START_3D_CMDBUF:
381 		if (p->family >= CHIP_RV770 || pkt->count) {
382 			DRM_ERROR("bad START_3D\n");
383 			return -EINVAL;
384 		}
385 		break;
386 	case PACKET3_CONTEXT_CONTROL:
387 		if (pkt->count != 1) {
388 			DRM_ERROR("bad CONTEXT_CONTROL\n");
389 			return -EINVAL;
390 		}
391 		break;
392 	case PACKET3_INDEX_TYPE:
393 	case PACKET3_NUM_INSTANCES:
394 		if (pkt->count) {
395 			DRM_ERROR("bad INDEX_TYPE/NUM_INSTANCES\n");
396 			return -EINVAL;
397 		}
398 		break;
399 	case PACKET3_DRAW_INDEX:
400 		if (pkt->count != 3) {
401 			DRM_ERROR("bad DRAW_INDEX\n");
402 			return -EINVAL;
403 		}
404 		r = r600_cs_packet_next_reloc(p, &reloc);
405 		if (r) {
406 			DRM_ERROR("bad DRAW_INDEX\n");
407 			return -EINVAL;
408 		}
409 		ib[idx+0] = idx_value + (u32)(reloc->lobj.gpu_offset & 0xffffffff);
410 		ib[idx+1] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
411 		break;
412 	case PACKET3_DRAW_INDEX_AUTO:
413 		if (pkt->count != 1) {
414 			DRM_ERROR("bad DRAW_INDEX_AUTO\n");
415 			return -EINVAL;
416 		}
417 		break;
418 	case PACKET3_DRAW_INDEX_IMMD_BE:
419 	case PACKET3_DRAW_INDEX_IMMD:
420 		if (pkt->count < 2) {
421 			DRM_ERROR("bad DRAW_INDEX_IMMD\n");
422 			return -EINVAL;
423 		}
424 		break;
425 	case PACKET3_WAIT_REG_MEM:
426 		if (pkt->count != 5) {
427 			DRM_ERROR("bad WAIT_REG_MEM\n");
428 			return -EINVAL;
429 		}
430 		/* bit 4 is reg (0) or mem (1) */
431 		if (idx_value & 0x10) {
432 			r = r600_cs_packet_next_reloc(p, &reloc);
433 			if (r) {
434 				DRM_ERROR("bad WAIT_REG_MEM\n");
435 				return -EINVAL;
436 			}
437 			ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
438 			ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
439 		}
440 		break;
441 	case PACKET3_SURFACE_SYNC:
442 		if (pkt->count != 3) {
443 			DRM_ERROR("bad SURFACE_SYNC\n");
444 			return -EINVAL;
445 		}
446 		/* 0xffffffff/0x0 is flush all cache flag */
447 		if (radeon_get_ib_value(p, idx + 1) != 0xffffffff ||
448 		    radeon_get_ib_value(p, idx + 2) != 0) {
449 			r = r600_cs_packet_next_reloc(p, &reloc);
450 			if (r) {
451 				DRM_ERROR("bad SURFACE_SYNC\n");
452 				return -EINVAL;
453 			}
454 			ib[idx+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
455 		}
456 		break;
457 	case PACKET3_EVENT_WRITE:
458 		if (pkt->count != 2 && pkt->count != 0) {
459 			DRM_ERROR("bad EVENT_WRITE\n");
460 			return -EINVAL;
461 		}
462 		if (pkt->count) {
463 			r = r600_cs_packet_next_reloc(p, &reloc);
464 			if (r) {
465 				DRM_ERROR("bad EVENT_WRITE\n");
466 				return -EINVAL;
467 			}
468 			ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
469 			ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
470 		}
471 		break;
472 	case PACKET3_EVENT_WRITE_EOP:
473 		if (pkt->count != 4) {
474 			DRM_ERROR("bad EVENT_WRITE_EOP\n");
475 			return -EINVAL;
476 		}
477 		r = r600_cs_packet_next_reloc(p, &reloc);
478 		if (r) {
479 			DRM_ERROR("bad EVENT_WRITE\n");
480 			return -EINVAL;
481 		}
482 		ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
483 		ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
484 		break;
485 	case PACKET3_SET_CONFIG_REG:
486 		start_reg = (idx_value << 2) + PACKET3_SET_CONFIG_REG_OFFSET;
487 		end_reg = 4 * pkt->count + start_reg - 4;
488 		if ((start_reg < PACKET3_SET_CONFIG_REG_OFFSET) ||
489 		    (start_reg >= PACKET3_SET_CONFIG_REG_END) ||
490 		    (end_reg >= PACKET3_SET_CONFIG_REG_END)) {
491 			DRM_ERROR("bad PACKET3_SET_CONFIG_REG\n");
492 			return -EINVAL;
493 		}
494 		for (i = 0; i < pkt->count; i++) {
495 			reg = start_reg + (4 * i);
496 			switch (reg) {
497 			case SQ_ESGS_RING_BASE:
498 			case SQ_GSVS_RING_BASE:
499 			case SQ_ESTMP_RING_BASE:
500 			case SQ_GSTMP_RING_BASE:
501 			case SQ_VSTMP_RING_BASE:
502 			case SQ_PSTMP_RING_BASE:
503 			case SQ_FBUF_RING_BASE:
504 			case SQ_REDUC_RING_BASE:
505 			case SX_MEMORY_EXPORT_BASE:
506 				r = r600_cs_packet_next_reloc(p, &reloc);
507 				if (r) {
508 					DRM_ERROR("bad SET_CONFIG_REG "
509 							"0x%04X\n", reg);
510 					return -EINVAL;
511 				}
512 				ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
513 				break;
514 			case CP_COHER_BASE:
515 				/* use PACKET3_SURFACE_SYNC */
516 				return -EINVAL;
517 			default:
518 				break;
519 			}
520 		}
521 		break;
522 	case PACKET3_SET_CONTEXT_REG:
523 		start_reg = (idx_value << 2) + PACKET3_SET_CONTEXT_REG_OFFSET;
524 		end_reg = 4 * pkt->count + start_reg - 4;
525 		if ((start_reg < PACKET3_SET_CONTEXT_REG_OFFSET) ||
526 		    (start_reg >= PACKET3_SET_CONTEXT_REG_END) ||
527 		    (end_reg >= PACKET3_SET_CONTEXT_REG_END)) {
528 			DRM_ERROR("bad PACKET3_SET_CONTEXT_REG\n");
529 			return -EINVAL;
530 		}
531 		for (i = 0; i < pkt->count; i++) {
532 			reg = start_reg + (4 * i);
533 			switch (reg) {
534 			/* This register were added late, there is userspace
535 			 * which does provide relocation for those but set
536 			 * 0 offset. In order to avoid breaking old userspace
537 			 * we detect this and set address to point to last
538 			 * CB_COLOR0_BASE, note that if userspace doesn't set
539 			 * CB_COLOR0_BASE before this register we will report
540 			 * error. Old userspace always set CB_COLOR0_BASE
541 			 * before any of this.
542 			 */
543 			case R_0280E0_CB_COLOR0_FRAG:
544 			case R_0280E4_CB_COLOR1_FRAG:
545 			case R_0280E8_CB_COLOR2_FRAG:
546 			case R_0280EC_CB_COLOR3_FRAG:
547 			case R_0280F0_CB_COLOR4_FRAG:
548 			case R_0280F4_CB_COLOR5_FRAG:
549 			case R_0280F8_CB_COLOR6_FRAG:
550 			case R_0280FC_CB_COLOR7_FRAG:
551 			case R_0280C0_CB_COLOR0_TILE:
552 			case R_0280C4_CB_COLOR1_TILE:
553 			case R_0280C8_CB_COLOR2_TILE:
554 			case R_0280CC_CB_COLOR3_TILE:
555 			case R_0280D0_CB_COLOR4_TILE:
556 			case R_0280D4_CB_COLOR5_TILE:
557 			case R_0280D8_CB_COLOR6_TILE:
558 			case R_0280DC_CB_COLOR7_TILE:
559 				if (!r600_cs_packet_next_is_pkt3_nop(p)) {
560 					if (!track->cb_color0_base_last) {
561 						dev_err(p->dev, "Broken old userspace ? no cb_color0_base supplied before trying to write 0x%08X\n", reg);
562 						return -EINVAL;
563 					}
564 					ib[idx+1+i] = track->cb_color0_base_last;
565 					printk_once(KERN_WARNING "radeon: You have old & broken userspace "
566 						"please consider updating mesa & xf86-video-ati\n");
567 				} else {
568 					r = r600_cs_packet_next_reloc(p, &reloc);
569 					if (r) {
570 						dev_err(p->dev, "bad SET_CONTEXT_REG 0x%04X\n", reg);
571 						return -EINVAL;
572 					}
573 					ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
574 				}
575 				break;
576 			case DB_DEPTH_BASE:
577 			case DB_HTILE_DATA_BASE:
578 			case CB_COLOR0_BASE:
579 				r = r600_cs_packet_next_reloc(p, &reloc);
580 				if (r) {
581 					DRM_ERROR("bad SET_CONTEXT_REG "
582 							"0x%04X\n", reg);
583 					return -EINVAL;
584 				}
585 				ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
586 				track->cb_color0_base_last = ib[idx+1+i];
587 				break;
588 			case CB_COLOR1_BASE:
589 			case CB_COLOR2_BASE:
590 			case CB_COLOR3_BASE:
591 			case CB_COLOR4_BASE:
592 			case CB_COLOR5_BASE:
593 			case CB_COLOR6_BASE:
594 			case CB_COLOR7_BASE:
595 			case SQ_PGM_START_FS:
596 			case SQ_PGM_START_ES:
597 			case SQ_PGM_START_VS:
598 			case SQ_PGM_START_GS:
599 			case SQ_PGM_START_PS:
600 				r = r600_cs_packet_next_reloc(p, &reloc);
601 				if (r) {
602 					DRM_ERROR("bad SET_CONTEXT_REG "
603 							"0x%04X\n", reg);
604 					return -EINVAL;
605 				}
606 				ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
607 				break;
608 			case VGT_DMA_BASE:
609 			case VGT_DMA_BASE_HI:
610 				/* These should be handled by DRAW_INDEX packet 3 */
611 			case VGT_STRMOUT_BASE_OFFSET_0:
612 			case VGT_STRMOUT_BASE_OFFSET_1:
613 			case VGT_STRMOUT_BASE_OFFSET_2:
614 			case VGT_STRMOUT_BASE_OFFSET_3:
615 			case VGT_STRMOUT_BASE_OFFSET_HI_0:
616 			case VGT_STRMOUT_BASE_OFFSET_HI_1:
617 			case VGT_STRMOUT_BASE_OFFSET_HI_2:
618 			case VGT_STRMOUT_BASE_OFFSET_HI_3:
619 			case VGT_STRMOUT_BUFFER_BASE_0:
620 			case VGT_STRMOUT_BUFFER_BASE_1:
621 			case VGT_STRMOUT_BUFFER_BASE_2:
622 			case VGT_STRMOUT_BUFFER_BASE_3:
623 			case VGT_STRMOUT_BUFFER_OFFSET_0:
624 			case VGT_STRMOUT_BUFFER_OFFSET_1:
625 			case VGT_STRMOUT_BUFFER_OFFSET_2:
626 			case VGT_STRMOUT_BUFFER_OFFSET_3:
627 				/* These should be handled by STRMOUT_BUFFER packet 3 */
628 				DRM_ERROR("bad context reg: 0x%08x\n", reg);
629 				return -EINVAL;
630 			default:
631 				break;
632 			}
633 		}
634 		break;
635 	case PACKET3_SET_RESOURCE:
636 		if (pkt->count % 7) {
637 			DRM_ERROR("bad SET_RESOURCE\n");
638 			return -EINVAL;
639 		}
640 		start_reg = (idx_value << 2) + PACKET3_SET_RESOURCE_OFFSET;
641 		end_reg = 4 * pkt->count + start_reg - 4;
642 		if ((start_reg < PACKET3_SET_RESOURCE_OFFSET) ||
643 		    (start_reg >= PACKET3_SET_RESOURCE_END) ||
644 		    (end_reg >= PACKET3_SET_RESOURCE_END)) {
645 			DRM_ERROR("bad SET_RESOURCE\n");
646 			return -EINVAL;
647 		}
648 		for (i = 0; i < (pkt->count / 7); i++) {
649 			switch (G__SQ_VTX_CONSTANT_TYPE(radeon_get_ib_value(p, idx+(i*7)+6+1))) {
650 			case SQ_TEX_VTX_VALID_TEXTURE:
651 				/* tex base */
652 				r = r600_cs_packet_next_reloc(p, &reloc);
653 				if (r) {
654 					DRM_ERROR("bad SET_RESOURCE\n");
655 					return -EINVAL;
656 				}
657 				ib[idx+1+(i*7)+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
658 				/* tex mip base */
659 				r = r600_cs_packet_next_reloc(p, &reloc);
660 				if (r) {
661 					DRM_ERROR("bad SET_RESOURCE\n");
662 					return -EINVAL;
663 				}
664 				ib[idx+1+(i*7)+3] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
665 				break;
666 			case SQ_TEX_VTX_VALID_BUFFER:
667 				/* vtx base */
668 				r = r600_cs_packet_next_reloc(p, &reloc);
669 				if (r) {
670 					DRM_ERROR("bad SET_RESOURCE\n");
671 					return -EINVAL;
672 				}
673 				ib[idx+1+(i*7)+0] += (u32)((reloc->lobj.gpu_offset) & 0xffffffff);
674 				ib[idx+1+(i*7)+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
675 				break;
676 			case SQ_TEX_VTX_INVALID_TEXTURE:
677 			case SQ_TEX_VTX_INVALID_BUFFER:
678 			default:
679 				DRM_ERROR("bad SET_RESOURCE\n");
680 				return -EINVAL;
681 			}
682 		}
683 		break;
684 	case PACKET3_SET_ALU_CONST:
685 		start_reg = (idx_value << 2) + PACKET3_SET_ALU_CONST_OFFSET;
686 		end_reg = 4 * pkt->count + start_reg - 4;
687 		if ((start_reg < PACKET3_SET_ALU_CONST_OFFSET) ||
688 		    (start_reg >= PACKET3_SET_ALU_CONST_END) ||
689 		    (end_reg >= PACKET3_SET_ALU_CONST_END)) {
690 			DRM_ERROR("bad SET_ALU_CONST\n");
691 			return -EINVAL;
692 		}
693 		break;
694 	case PACKET3_SET_BOOL_CONST:
695 		start_reg = (idx_value << 2) + PACKET3_SET_BOOL_CONST_OFFSET;
696 		end_reg = 4 * pkt->count + start_reg - 4;
697 		if ((start_reg < PACKET3_SET_BOOL_CONST_OFFSET) ||
698 		    (start_reg >= PACKET3_SET_BOOL_CONST_END) ||
699 		    (end_reg >= PACKET3_SET_BOOL_CONST_END)) {
700 			DRM_ERROR("bad SET_BOOL_CONST\n");
701 			return -EINVAL;
702 		}
703 		break;
704 	case PACKET3_SET_LOOP_CONST:
705 		start_reg = (idx_value << 2) + PACKET3_SET_LOOP_CONST_OFFSET;
706 		end_reg = 4 * pkt->count + start_reg - 4;
707 		if ((start_reg < PACKET3_SET_LOOP_CONST_OFFSET) ||
708 		    (start_reg >= PACKET3_SET_LOOP_CONST_END) ||
709 		    (end_reg >= PACKET3_SET_LOOP_CONST_END)) {
710 			DRM_ERROR("bad SET_LOOP_CONST\n");
711 			return -EINVAL;
712 		}
713 		break;
714 	case PACKET3_SET_CTL_CONST:
715 		start_reg = (idx_value << 2) + PACKET3_SET_CTL_CONST_OFFSET;
716 		end_reg = 4 * pkt->count + start_reg - 4;
717 		if ((start_reg < PACKET3_SET_CTL_CONST_OFFSET) ||
718 		    (start_reg >= PACKET3_SET_CTL_CONST_END) ||
719 		    (end_reg >= PACKET3_SET_CTL_CONST_END)) {
720 			DRM_ERROR("bad SET_CTL_CONST\n");
721 			return -EINVAL;
722 		}
723 		break;
724 	case PACKET3_SET_SAMPLER:
725 		if (pkt->count % 3) {
726 			DRM_ERROR("bad SET_SAMPLER\n");
727 			return -EINVAL;
728 		}
729 		start_reg = (idx_value << 2) + PACKET3_SET_SAMPLER_OFFSET;
730 		end_reg = 4 * pkt->count + start_reg - 4;
731 		if ((start_reg < PACKET3_SET_SAMPLER_OFFSET) ||
732 		    (start_reg >= PACKET3_SET_SAMPLER_END) ||
733 		    (end_reg >= PACKET3_SET_SAMPLER_END)) {
734 			DRM_ERROR("bad SET_SAMPLER\n");
735 			return -EINVAL;
736 		}
737 		break;
738 	case PACKET3_SURFACE_BASE_UPDATE:
739 		if (p->family >= CHIP_RV770 || p->family == CHIP_R600) {
740 			DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
741 			return -EINVAL;
742 		}
743 		if (pkt->count) {
744 			DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
745 			return -EINVAL;
746 		}
747 		break;
748 	case PACKET3_NOP:
749 		break;
750 	default:
751 		DRM_ERROR("Packet3 opcode %x not supported\n", pkt->opcode);
752 		return -EINVAL;
753 	}
754 	return 0;
755 }
756 
757 int r600_cs_parse(struct radeon_cs_parser *p)
758 {
759 	struct radeon_cs_packet pkt;
760 	struct r600_cs_track *track;
761 	int r;
762 
763 	track = kzalloc(sizeof(*track), GFP_KERNEL);
764 	p->track = track;
765 	do {
766 		r = r600_cs_packet_parse(p, &pkt, p->idx);
767 		if (r) {
768 			return r;
769 		}
770 		p->idx += pkt.count + 2;
771 		switch (pkt.type) {
772 		case PACKET_TYPE0:
773 			r = r600_cs_parse_packet0(p, &pkt);
774 			break;
775 		case PACKET_TYPE2:
776 			break;
777 		case PACKET_TYPE3:
778 			r = r600_packet3_check(p, &pkt);
779 			break;
780 		default:
781 			DRM_ERROR("Unknown packet type %d !\n", pkt.type);
782 			return -EINVAL;
783 		}
784 		if (r) {
785 			return r;
786 		}
787 	} while (p->idx < p->chunks[p->chunk_ib_idx].length_dw);
788 #if 0
789 	for (r = 0; r < p->ib->length_dw; r++) {
790 		printk(KERN_INFO "%05d  0x%08X\n", r, p->ib->ptr[r]);
791 		mdelay(1);
792 	}
793 #endif
794 	return 0;
795 }
796 
797 static int r600_cs_parser_relocs_legacy(struct radeon_cs_parser *p)
798 {
799 	if (p->chunk_relocs_idx == -1) {
800 		return 0;
801 	}
802 	p->relocs = kzalloc(sizeof(struct radeon_cs_reloc), GFP_KERNEL);
803 	if (p->relocs == NULL) {
804 		return -ENOMEM;
805 	}
806 	return 0;
807 }
808 
809 /**
810  * cs_parser_fini() - clean parser states
811  * @parser:	parser structure holding parsing context.
812  * @error:	error number
813  *
814  * If error is set than unvalidate buffer, otherwise just free memory
815  * used by parsing context.
816  **/
817 static void r600_cs_parser_fini(struct radeon_cs_parser *parser, int error)
818 {
819 	unsigned i;
820 
821 	kfree(parser->relocs);
822 	for (i = 0; i < parser->nchunks; i++) {
823 		kfree(parser->chunks[i].kdata);
824 		kfree(parser->chunks[i].kpage[0]);
825 		kfree(parser->chunks[i].kpage[1]);
826 	}
827 	kfree(parser->chunks);
828 	kfree(parser->chunks_array);
829 }
830 
831 int r600_cs_legacy(struct drm_device *dev, void *data, struct drm_file *filp,
832 			unsigned family, u32 *ib, int *l)
833 {
834 	struct radeon_cs_parser parser;
835 	struct radeon_cs_chunk *ib_chunk;
836 	struct radeon_ib	fake_ib;
837 	int r;
838 
839 	/* initialize parser */
840 	memset(&parser, 0, sizeof(struct radeon_cs_parser));
841 	parser.filp = filp;
842 	parser.dev = &dev->pdev->dev;
843 	parser.rdev = NULL;
844 	parser.family = family;
845 	parser.ib = &fake_ib;
846 	fake_ib.ptr = ib;
847 	r = radeon_cs_parser_init(&parser, data);
848 	if (r) {
849 		DRM_ERROR("Failed to initialize parser !\n");
850 		r600_cs_parser_fini(&parser, r);
851 		return r;
852 	}
853 	r = r600_cs_parser_relocs_legacy(&parser);
854 	if (r) {
855 		DRM_ERROR("Failed to parse relocation !\n");
856 		r600_cs_parser_fini(&parser, r);
857 		return r;
858 	}
859 	/* Copy the packet into the IB, the parser will read from the
860 	 * input memory (cached) and write to the IB (which can be
861 	 * uncached). */
862 	ib_chunk = &parser.chunks[parser.chunk_ib_idx];
863 	parser.ib->length_dw = ib_chunk->length_dw;
864 	*l = parser.ib->length_dw;
865 	r = r600_cs_parse(&parser);
866 	if (r) {
867 		DRM_ERROR("Invalid command stream !\n");
868 		r600_cs_parser_fini(&parser, r);
869 		return r;
870 	}
871 	r = radeon_cs_finish_pages(&parser);
872 	if (r) {
873 		DRM_ERROR("Invalid command stream !\n");
874 		r600_cs_parser_fini(&parser, r);
875 		return r;
876 	}
877 	r600_cs_parser_fini(&parser, r);
878 	return r;
879 }
880 
881 void r600_cs_legacy_init(void)
882 {
883 	r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_nomm;
884 }
885