xref: /openbmc/linux/drivers/video/fbdev/kyro/STG4000OverlayDevice.c (revision ead5d1f4d877e92c051e1a1ade623d0d30e71619)
1 /*
2  *  linux/drivers/video/kyro/STG4000OverlayDevice.c
3  *
4  *  Copyright (C) 2000 Imagination Technologies Ltd
5  *  Copyright (C) 2002 STMicroelectronics
6  *
7  * This file is subject to the terms and conditions of the GNU General Public
8  * License.  See the file COPYING in the main directory of this archive
9  * for more details.
10  */
11 
12 #include <linux/kernel.h>
13 #include <linux/errno.h>
14 #include <linux/types.h>
15 
16 #include "STG4000Reg.h"
17 #include "STG4000Interface.h"
18 
19 /* HW Defines */
20 
21 #define STG4000_NO_SCALING    0x800
22 #define STG4000_NO_DECIMATION 0xFFFFFFFF
23 
24 /* Primary surface */
25 #define STG4000_PRIM_NUM_PIX   5
26 #define STG4000_PRIM_ALIGN     4
27 #define STG4000_PRIM_ADDR_BITS 20
28 
29 #define STG4000_PRIM_MIN_WIDTH  640
30 #define STG4000_PRIM_MAX_WIDTH  1600
31 #define STG4000_PRIM_MIN_HEIGHT 480
32 #define STG4000_PRIM_MAX_HEIGHT 1200
33 
34 /* Overlay surface */
35 #define STG4000_OVRL_NUM_PIX   4
36 #define STG4000_OVRL_ALIGN     2
37 #define STG4000_OVRL_ADDR_BITS 20
38 #define STG4000_OVRL_NUM_MODES 5
39 
40 #define STG4000_OVRL_MIN_WIDTH  0
41 #define STG4000_OVRL_MAX_WIDTH  720
42 #define STG4000_OVRL_MIN_HEIGHT 0
43 #define STG4000_OVRL_MAX_HEIGHT 576
44 
45 /* Decimation and Scaling */
46 static u32 adwDecim8[33] = {
47 	    0xffffffff, 0xfffeffff, 0xffdffbff, 0xfefefeff, 0xfdf7efbf,
48 	    0xfbdf7bdf, 0xf7bbddef, 0xeeeeeeef, 0xeeddbb77, 0xedb76db7,
49 	    0xdb6db6db, 0xdb5b5b5b, 0xdab5ad6b, 0xd5ab55ab, 0xd555aaab,
50 	    0xaaaaaaab, 0xaaaa5555, 0xaa952a55, 0xa94a5295, 0xa5252525,
51 	    0xa4924925, 0x92491249, 0x91224489, 0x91111111, 0x90884211,
52 	    0x88410821, 0x88102041, 0x81010101, 0x80800801, 0x80010001,
53 	    0x80000001, 0x00000001, 0x00000000
54 };
55 
56 typedef struct _OVRL_SRC_DEST {
57 	/*clipped on-screen pixel position of overlay */
58 	u32 ulDstX1;
59 	u32 ulDstY1;
60 	u32 ulDstX2;
61 	u32 ulDstY2;
62 
63 	/*clipped pixel pos of source data within buffer thses need to be 128 bit word aligned */
64 	u32 ulSrcX1;
65 	u32 ulSrcY1;
66 	u32 ulSrcX2;
67 	u32 ulSrcY2;
68 
69 	/* on-screen pixel position of overlay */
70 	s32 lDstX1;
71 	s32 lDstY1;
72 	s32 lDstX2;
73 	s32 lDstY2;
74 } OVRL_SRC_DEST;
75 
76 static u32 ovlWidth, ovlHeight, ovlStride;
77 static int ovlLinear;
78 
ResetOverlayRegisters(volatile STG4000REG __iomem * pSTGReg)79 void ResetOverlayRegisters(volatile STG4000REG __iomem *pSTGReg)
80 {
81 	u32 tmp;
82 
83 	/* Set Overlay address to default */
84 	tmp = STG_READ_REG(DACOverlayAddr);
85 	CLEAR_BITS_FRM_TO(0, 20);
86 	CLEAR_BIT(31);
87 	STG_WRITE_REG(DACOverlayAddr, tmp);
88 
89 	/* Set Overlay U address */
90 	tmp = STG_READ_REG(DACOverlayUAddr);
91 	CLEAR_BITS_FRM_TO(0, 20);
92 	STG_WRITE_REG(DACOverlayUAddr, tmp);
93 
94 	/* Set Overlay V address */
95 	tmp = STG_READ_REG(DACOverlayVAddr);
96 	CLEAR_BITS_FRM_TO(0, 20);
97 	STG_WRITE_REG(DACOverlayVAddr, tmp);
98 
99 	/* Set Overlay Size */
100 	tmp = STG_READ_REG(DACOverlaySize);
101 	CLEAR_BITS_FRM_TO(0, 10);
102 	CLEAR_BITS_FRM_TO(12, 31);
103 	STG_WRITE_REG(DACOverlaySize, tmp);
104 
105 	/* Set Overlay Vt Decimation */
106 	tmp = STG4000_NO_DECIMATION;
107 	STG_WRITE_REG(DACOverlayVtDec, tmp);
108 
109 	/* Set Overlay format to default value */
110 	tmp = STG_READ_REG(DACPixelFormat);
111 	CLEAR_BITS_FRM_TO(4, 7);
112 	CLEAR_BITS_FRM_TO(16, 22);
113 	STG_WRITE_REG(DACPixelFormat, tmp);
114 
115 	/* Set Vertical scaling to default */
116 	tmp = STG_READ_REG(DACVerticalScal);
117 	CLEAR_BITS_FRM_TO(0, 11);
118 	CLEAR_BITS_FRM_TO(16, 22);
119 	tmp |= STG4000_NO_SCALING;	/* Set to no scaling */
120 	STG_WRITE_REG(DACVerticalScal, tmp);
121 
122 	/* Set Horizontal Scaling to default */
123 	tmp = STG_READ_REG(DACHorizontalScal);
124 	CLEAR_BITS_FRM_TO(0, 11);
125 	CLEAR_BITS_FRM_TO(16, 17);
126 	tmp |= STG4000_NO_SCALING;	/* Set to no scaling */
127 	STG_WRITE_REG(DACHorizontalScal, tmp);
128 
129 	/* Set Blend mode to Alpha Blend */
130 	/* ????? SG 08/11/2001 Surely this isn't the alpha blend mode,
131 	   hopefully its overwrite
132 	 */
133 	tmp = STG_READ_REG(DACBlendCtrl);
134 	CLEAR_BITS_FRM_TO(0, 30);
135 	tmp = (GRAPHICS_MODE << 28);
136 	STG_WRITE_REG(DACBlendCtrl, tmp);
137 
138 }
139 
CreateOverlaySurface(volatile STG4000REG __iomem * pSTGReg,u32 inWidth,u32 inHeight,int bLinear,u32 ulOverlayOffset,u32 * retStride,u32 * retUVStride)140 int CreateOverlaySurface(volatile STG4000REG __iomem *pSTGReg,
141 			 u32 inWidth,
142 			 u32 inHeight,
143 			 int bLinear,
144 			 u32 ulOverlayOffset,
145 			 u32 * retStride, u32 * retUVStride)
146 {
147 	u32 tmp;
148 	u32 ulStride;
149 
150 	if (inWidth > STG4000_OVRL_MAX_WIDTH ||
151 	    inHeight > STG4000_OVRL_MAX_HEIGHT) {
152 		return -EINVAL;
153 	}
154 
155 	/* Stride in 16 byte words - 16Bpp */
156 	if (bLinear) {
157 		/* Format is 16bits so num 16 byte words is width/8 */
158 		if ((inWidth & 0x7) == 0) {	/* inWidth % 8 */
159 			ulStride = (inWidth / 8);
160 		} else {
161 			/* Round up to next 16byte boundary */
162 			ulStride = ((inWidth + 8) / 8);
163 		}
164 	} else {
165 		/* Y component is 8bits so num 16 byte words is width/16 */
166 		if ((inWidth & 0xf) == 0) {	/* inWidth % 16 */
167 			ulStride = (inWidth / 16);
168 		} else {
169 			/* Round up to next 16byte boundary */
170 			ulStride = ((inWidth + 16) / 16);
171 		}
172 	}
173 
174 
175 	/* Set Overlay address and Format mode */
176 	tmp = STG_READ_REG(DACOverlayAddr);
177 	CLEAR_BITS_FRM_TO(0, 20);
178 	if (bLinear) {
179 		CLEAR_BIT(31);	/* Overlay format to Linear */
180 	} else {
181 		tmp |= SET_BIT(31);	/* Overlay format to Planer */
182 	}
183 
184 	/* Only bits 24:4 of the Overlay address */
185 	tmp |= (ulOverlayOffset >> 4);
186 	STG_WRITE_REG(DACOverlayAddr, tmp);
187 
188 	if (!bLinear) {
189 		u32 uvSize =
190 		    (inWidth & 0x1) ? (inWidth + 1 / 2) : (inWidth / 2);
191 		u32 uvStride;
192 		u32 ulOffset;
193 		/* Y component is 8bits so num 32 byte words is width/32 */
194 		if ((uvSize & 0xf) == 0) {	/* inWidth % 16 */
195 			uvStride = (uvSize / 16);
196 		} else {
197 			/* Round up to next 32byte boundary */
198 			uvStride = ((uvSize + 16) / 16);
199 		}
200 
201 		ulOffset = ulOverlayOffset + (inHeight * (ulStride * 16));
202 		/* Align U,V data to 32byte boundary */
203 		if ((ulOffset & 0x1f) != 0)
204 			ulOffset = (ulOffset + 32L) & 0xffffffE0L;
205 
206 		tmp = STG_READ_REG(DACOverlayUAddr);
207 		CLEAR_BITS_FRM_TO(0, 20);
208 		tmp |= (ulOffset >> 4);
209 		STG_WRITE_REG(DACOverlayUAddr, tmp);
210 
211 		ulOffset += (inHeight / 2) * (uvStride * 16);
212 		/* Align U,V data to 32byte boundary */
213 		if ((ulOffset & 0x1f) != 0)
214 			ulOffset = (ulOffset + 32L) & 0xffffffE0L;
215 
216 		tmp = STG_READ_REG(DACOverlayVAddr);
217 		CLEAR_BITS_FRM_TO(0, 20);
218 		tmp |= (ulOffset >> 4);
219 		STG_WRITE_REG(DACOverlayVAddr, tmp);
220 
221 		*retUVStride = uvStride * 16;
222 	}
223 
224 
225 	/* Set Overlay YUV pixel format
226 	 * Make sure that LUT not used - ??????
227 	 */
228 	tmp = STG_READ_REG(DACPixelFormat);
229 	/* Only support Planer or UYVY linear formats */
230 	CLEAR_BITS_FRM_TO(4, 9);
231 	STG_WRITE_REG(DACPixelFormat, tmp);
232 
233 	ovlWidth = inWidth;
234 	ovlHeight = inHeight;
235 	ovlStride = ulStride;
236 	ovlLinear = bLinear;
237 	*retStride = ulStride << 4;	/* In bytes */
238 
239 	return 0;
240 }
241 
SetOverlayBlendMode(volatile STG4000REG __iomem * pSTGReg,OVRL_BLEND_MODE mode,u32 ulAlpha,u32 ulColorKey)242 int SetOverlayBlendMode(volatile STG4000REG __iomem *pSTGReg,
243 			OVRL_BLEND_MODE mode,
244 			u32 ulAlpha, u32 ulColorKey)
245 {
246 	u32 tmp;
247 
248 	tmp = STG_READ_REG(DACBlendCtrl);
249 	CLEAR_BITS_FRM_TO(28, 30);
250 	tmp |= (mode << 28);
251 
252 	switch (mode) {
253 	case COLOR_KEY:
254 		CLEAR_BITS_FRM_TO(0, 23);
255 		tmp |= (ulColorKey & 0x00FFFFFF);
256 		break;
257 
258 	case GLOBAL_ALPHA:
259 		CLEAR_BITS_FRM_TO(24, 27);
260 		tmp |= ((ulAlpha & 0xF) << 24);
261 		break;
262 
263 	case CK_PIXEL_ALPHA:
264 		CLEAR_BITS_FRM_TO(0, 23);
265 		tmp |= (ulColorKey & 0x00FFFFFF);
266 		break;
267 
268 	case CK_GLOBAL_ALPHA:
269 		CLEAR_BITS_FRM_TO(0, 23);
270 		tmp |= (ulColorKey & 0x00FFFFFF);
271 		CLEAR_BITS_FRM_TO(24, 27);
272 		tmp |= ((ulAlpha & 0xF) << 24);
273 		break;
274 
275 	case GRAPHICS_MODE:
276 	case PER_PIXEL_ALPHA:
277 		break;
278 
279 	default:
280 		return -EINVAL;
281 	}
282 
283 	STG_WRITE_REG(DACBlendCtrl, tmp);
284 
285 	return 0;
286 }
287 
EnableOverlayPlane(volatile STG4000REG __iomem * pSTGReg)288 void EnableOverlayPlane(volatile STG4000REG __iomem *pSTGReg)
289 {
290 	u32 tmp;
291 	/* Enable Overlay */
292 	tmp = STG_READ_REG(DACPixelFormat);
293 	tmp |= SET_BIT(7);
294 	STG_WRITE_REG(DACPixelFormat, tmp);
295 
296 	/* Set video stream control */
297 	tmp = STG_READ_REG(DACStreamCtrl);
298 	tmp |= SET_BIT(1);	/* video stream */
299 	STG_WRITE_REG(DACStreamCtrl, tmp);
300 }
301 
Overlap(u32 ulBits,u32 ulPattern)302 static u32 Overlap(u32 ulBits, u32 ulPattern)
303 {
304 	u32 ulCount = 0;
305 
306 	while (ulBits) {
307 		if (!(ulPattern & 1))
308 			ulCount++;
309 		ulBits--;
310 		ulPattern = ulPattern >> 1;
311 	}
312 
313 	return ulCount;
314 
315 }
316 
SetOverlayViewPort(volatile STG4000REG __iomem * pSTGReg,u32 left,u32 top,u32 right,u32 bottom)317 int SetOverlayViewPort(volatile STG4000REG __iomem *pSTGReg,
318 		       u32 left, u32 top,
319 		       u32 right, u32 bottom)
320 {
321 	OVRL_SRC_DEST srcDest;
322 
323 	u32 ulSrcTop, ulSrcBottom;
324 	u32 ulSrc, ulDest;
325 	u32 ulFxScale, ulFxOffset;
326 	u32 ulHeight, ulWidth;
327 	u32 ulPattern;
328 	u32 ulDecimate, ulDecimated;
329 	u32 ulApplied;
330 	u32 ulDacXScale, ulDacYScale;
331 	u32 ulScale;
332 	u32 ulLeft, ulRight;
333 	u32 ulSrcLeft, ulSrcRight;
334 	u32 ulScaleLeft;
335 	u32 ulhDecim;
336 	u32 ulsVal;
337 	u32 ulVertDecFactor;
338 	int bResult;
339 	u32 ulClipOff = 0;
340 	u32 ulBits = 0;
341 	u32 ulsAdd = 0;
342 	u32 tmp, ulStride;
343 	u32 ulExcessPixels, ulClip, ulExtraLines;
344 
345 
346 	srcDest.ulSrcX1 = 0;
347 	srcDest.ulSrcY1 = 0;
348 	srcDest.ulSrcX2 = ovlWidth - 1;
349 	srcDest.ulSrcY2 = ovlHeight - 1;
350 
351 	srcDest.ulDstX1 = left;
352 	srcDest.ulDstY1 = top;
353 	srcDest.ulDstX2 = right;
354 	srcDest.ulDstY2 = bottom;
355 
356 	srcDest.lDstX1 = srcDest.ulDstX1;
357 	srcDest.lDstY1 = srcDest.ulDstY1;
358 	srcDest.lDstX2 = srcDest.ulDstX2;
359 	srcDest.lDstY2 = srcDest.ulDstY2;
360 
361     /************* Vertical decimation/scaling ******************/
362 
363 	/* Get Src Top and Bottom */
364 	ulSrcTop = srcDest.ulSrcY1;
365 	ulSrcBottom = srcDest.ulSrcY2;
366 
367 	ulSrc = ulSrcBottom - ulSrcTop;
368 	ulDest = srcDest.lDstY2 - srcDest.lDstY1;	/* on-screen overlay */
369 
370 	if (ulSrc <= 1)
371 		return -EINVAL;
372 
373 	/* First work out the position we are to display as offset from the
374 	 * source of the buffer
375 	 */
376 	ulFxScale = (ulDest << 11) / ulSrc;	/* fixed point scale factor */
377 	ulFxOffset = (srcDest.lDstY2 - srcDest.ulDstY2) << 11;
378 
379 	ulSrcBottom = ulSrcBottom - (ulFxOffset / ulFxScale);
380 	ulSrc = ulSrcBottom - ulSrcTop;
381 	ulHeight = ulSrc;
382 
383 	ulDest = srcDest.ulDstY2 - (srcDest.ulDstY1 - 1);
384 	ulPattern = adwDecim8[ulBits];
385 
386 	/* At this point ulSrc represents the input decimator */
387 	if (ulSrc > ulDest) {
388 		ulDecimate = ulSrc - ulDest;
389 		ulBits = 0;
390 		ulApplied = ulSrc / 32;
391 
392 		while (((ulBits * ulApplied) +
393 			Overlap((ulSrc % 32),
394 				adwDecim8[ulBits])) < ulDecimate)
395 			ulBits++;
396 
397 		ulPattern = adwDecim8[ulBits];
398 		ulDecimated =
399 		    (ulBits * ulApplied) + Overlap((ulSrc % 32),
400 						   ulPattern);
401 		ulSrc = ulSrc - ulDecimated;	/* the number number of lines that will go into the scaler */
402 	}
403 
404 	if (ulBits && (ulBits != 32)) {
405 		ulVertDecFactor = (63 - ulBits) / (32 - ulBits);	/* vertical decimation factor scaled up to nearest integer */
406 	} else {
407 		ulVertDecFactor = 1;
408 	}
409 
410 	ulDacYScale = ((ulSrc - 1) * 2048) / (ulDest + 1);
411 
412 	tmp = STG_READ_REG(DACOverlayVtDec);	/* Decimation */
413 	CLEAR_BITS_FRM_TO(0, 31);
414 	tmp = ulPattern;
415 	STG_WRITE_REG(DACOverlayVtDec, tmp);
416 
417 	/***************** Horizontal decimation/scaling ***************************/
418 
419 	/*
420 	 * Now we handle the horizontal case, this is a simplified version of
421 	 * the vertical case in that we decimate by factors of 2.  as we are
422 	 * working in words we should always be able to decimate by these
423 	 * factors.  as we always have to have a buffer which is aligned to a
424 	 * whole number of 128 bit words, we must align the left side to the
425 	 * lowest to the next lowest 128 bit boundary, and the right hand edge
426 	 * to the next largets boundary, (in a similar way to how we didi it in
427 	 * PMX1) as the left and right hand edges are aligned to these
428 	 * boundaries normally this only becomes an issue when we are chopping
429 	 * of one of the sides We shall work out vertical stuff first
430 	 */
431 	ulSrc = srcDest.ulSrcX2 - srcDest.ulSrcX1;
432 	ulDest = srcDest.lDstX2 - srcDest.lDstX1;
433 #ifdef _OLDCODE
434 	ulLeft = srcDest.ulDstX1;
435 	ulRight = srcDest.ulDstX2;
436 #else
437 	if (srcDest.ulDstX1 > 2) {
438 		ulLeft = srcDest.ulDstX1 + 2;
439 		ulRight = srcDest.ulDstX2 + 1;
440 	} else {
441 		ulLeft = srcDest.ulDstX1;
442 		ulRight = srcDest.ulDstX2 + 1;
443 	}
444 #endif
445 	/* first work out the position we are to display as offset from the source of the buffer */
446 	bResult = 1;
447 
448 	do {
449 		if (ulDest == 0)
450 			return -EINVAL;
451 
452 		/* source pixels per dest pixel <<11 */
453 		ulFxScale = ((ulSrc - 1) << 11) / (ulDest);
454 
455 		/* then number of destination pixels out we are */
456 		ulFxOffset = ulFxScale * ((srcDest.ulDstX1 - srcDest.lDstX1) + ulClipOff);
457 		ulFxOffset >>= 11;
458 
459 		/* this replaces the code which was making a decision as to use either ulFxOffset or ulSrcX1 */
460 		ulSrcLeft = srcDest.ulSrcX1 + ulFxOffset;
461 
462 		/* then number of destination pixels out we are */
463 		ulFxOffset = ulFxScale * (srcDest.lDstX2 - srcDest.ulDstX2);
464 		ulFxOffset >>= 11;
465 
466 		ulSrcRight = srcDest.ulSrcX2 - ulFxOffset;
467 
468 		/*
469 		 * we must align these to our 128 bit boundaries. we shall
470 		 * round down the pixel pos to the nearest 8 pixels.
471 		 */
472 		ulScaleLeft = ulSrcLeft;
473 
474 		/* shift fxscale until it is in the range of the scaler */
475 		ulhDecim = 0;
476 		ulScale = (((ulSrcRight - ulSrcLeft) - 1) << (11 - ulhDecim)) / (ulRight - ulLeft + 2);
477 
478 		while (ulScale > 0x800) {
479 			ulhDecim++;
480 			ulScale = (((ulSrcRight - ulSrcLeft) - 1) << (11 - ulhDecim)) / (ulRight - ulLeft + 2);
481 		}
482 
483 		/*
484 		 * to try and get the best values We first try and use
485 		 * src/dwdest for the scale factor, then we move onto src-1
486 		 *
487 		 * we want to check to see if we will need to clip data, if so
488 		 * then we should clip our source so that we don't need to
489 		 */
490 		if (!ovlLinear) {
491 			ulSrcLeft &= ~0x1f;
492 
493 			/*
494 			 * we must align the right hand edge to the next 32
495 			 * pixel` boundary, must be on a 256 boundary so u, and
496 			 * v are 128 bit aligned
497 			 */
498 			ulSrcRight = (ulSrcRight + 0x1f) & ~0x1f;
499 		} else {
500 			ulSrcLeft &= ~0x7;
501 
502 			/*
503 			 * we must align the right hand edge to the next
504 			 * 8pixel` boundary
505 			 */
506 			ulSrcRight = (ulSrcRight + 0x7) & ~0x7;
507 		}
508 
509 		/* this is the input size line store needs to cope with */
510 		ulWidth = ulSrcRight - ulSrcLeft;
511 
512 		/*
513 		 * use unclipped value to work out scale factror this is the
514 		 * scale factor we want we shall now work out the horizonal
515 		 * decimation and scaling
516 		 */
517 		ulsVal = ((ulWidth / 8) >> ulhDecim);
518 
519 		if ((ulWidth != (ulsVal << ulhDecim) * 8))
520 			ulsAdd = 1;
521 
522 		/* input pixels to scaler; */
523 		ulSrc = ulWidth >> ulhDecim;
524 
525 		if (ulSrc <= 2)
526 			return -EINVAL;
527 
528 		ulExcessPixels = ((((ulScaleLeft - ulSrcLeft)) << (11 - ulhDecim)) / ulScale);
529 
530 		ulClip = (ulSrc << 11) / ulScale;
531 		ulClip -= (ulRight - ulLeft);
532 		ulClip += ulExcessPixels;
533 
534 		if (ulClip)
535 			ulClip--;
536 
537 		/* We may need to do more here if we really have a HW rev < 5 */
538 	} while (!bResult);
539 
540 	ulExtraLines = (1 << ulhDecim) * ulVertDecFactor;
541 	ulExtraLines += 64;
542 	ulHeight += ulExtraLines;
543 
544 	ulDacXScale = ulScale;
545 
546 
547 	tmp = STG_READ_REG(DACVerticalScal);
548 	CLEAR_BITS_FRM_TO(0, 11);
549 	CLEAR_BITS_FRM_TO(16, 22);	/* Vertical Scaling */
550 
551 	/* Calculate new output line stride, this is always the number of 422
552 	   words in the line buffer, so it doesn't matter if the
553 	   mode is 420. Then set the vertical scale register.
554 	 */
555 	ulStride = (ulWidth >> (ulhDecim + 3)) + ulsAdd;
556 	tmp |= ((ulStride << 16) | (ulDacYScale));	/* DAC_LS_CTRL = stride */
557 	STG_WRITE_REG(DACVerticalScal, tmp);
558 
559 	/* Now set up the overlay size using the modified width and height
560 	   from decimate and scaling calculations
561 	 */
562 	tmp = STG_READ_REG(DACOverlaySize);
563 	CLEAR_BITS_FRM_TO(0, 10);
564 	CLEAR_BITS_FRM_TO(12, 31);
565 
566 	if (ovlLinear) {
567 		tmp |=
568 		    (ovlStride | ((ulHeight + 1) << 12) |
569 		     (((ulWidth / 8) - 1) << 23));
570 	} else {
571 		tmp |=
572 		    (ovlStride | ((ulHeight + 1) << 12) |
573 		     (((ulWidth / 32) - 1) << 23));
574 	}
575 
576 	STG_WRITE_REG(DACOverlaySize, tmp);
577 
578 	/* Set Video Window Start */
579 	tmp = ((ulLeft << 16)) | (srcDest.ulDstY1);
580 	STG_WRITE_REG(DACVidWinStart, tmp);
581 
582 	/* Set Video Window End */
583 	tmp = ((ulRight) << 16) | (srcDest.ulDstY2);
584 	STG_WRITE_REG(DACVidWinEnd, tmp);
585 
586 	/* Finally set up the rest of the overlay regs in the order
587 	   done in the IMG driver
588 	 */
589 	tmp = STG_READ_REG(DACPixelFormat);
590 	tmp = ((ulExcessPixels << 16) | tmp) & 0x7fffffff;
591 	STG_WRITE_REG(DACPixelFormat, tmp);
592 
593 	tmp = STG_READ_REG(DACHorizontalScal);
594 	CLEAR_BITS_FRM_TO(0, 11);
595 	CLEAR_BITS_FRM_TO(16, 17);
596 	tmp |= ((ulhDecim << 16) | (ulDacXScale));
597 	STG_WRITE_REG(DACHorizontalScal, tmp);
598 
599 	return 0;
600 }
601