2 * linux/drivers/video/kyro/STG4000OverlayDevice.c
4 * Copyright (C) 2000 Imagination Technologies Ltd
5 * Copyright (C) 2002 STMicroelectronics
7 * This file is subject to the terms and conditions of the GNU General Public
8 * License. See the file COPYING in the main directory of this archive
12 #include <linux/kernel.h>
13 #include <linux/errno.h>
14 #include <linux/types.h>
16 #include "STG4000Reg.h"
17 #include "STG4000Interface.h"
21 #define STG4000_NO_SCALING 0x800
22 #define STG4000_NO_DECIMATION 0xFFFFFFFF
25 #define STG4000_PRIM_NUM_PIX 5
26 #define STG4000_PRIM_ALIGN 4
27 #define STG4000_PRIM_ADDR_BITS 20
29 #define STG4000_PRIM_MIN_WIDTH 640
30 #define STG4000_PRIM_MAX_WIDTH 1600
31 #define STG4000_PRIM_MIN_HEIGHT 480
32 #define STG4000_PRIM_MAX_HEIGHT 1200
35 #define STG4000_OVRL_NUM_PIX 4
36 #define STG4000_OVRL_ALIGN 2
37 #define STG4000_OVRL_ADDR_BITS 20
38 #define STG4000_OVRL_NUM_MODES 5
40 #define STG4000_OVRL_MIN_WIDTH 0
41 #define STG4000_OVRL_MAX_WIDTH 720
42 #define STG4000_OVRL_MIN_HEIGHT 0
43 #define STG4000_OVRL_MAX_HEIGHT 576
45 /* Decimation and Scaling */
46 static u32 adwDecim8[33] = {
47 0xffffffff, 0xfffeffff, 0xffdffbff, 0xfefefeff, 0xfdf7efbf,
48 0xfbdf7bdf, 0xf7bbddef, 0xeeeeeeef, 0xeeddbb77, 0xedb76db7,
49 0xdb6db6db, 0xdb5b5b5b, 0xdab5ad6b, 0xd5ab55ab, 0xd555aaab,
50 0xaaaaaaab, 0xaaaa5555, 0xaa952a55, 0xa94a5295, 0xa5252525,
51 0xa4924925, 0x92491249, 0x91224489, 0x91111111, 0x90884211,
52 0x88410821, 0x88102041, 0x81010101, 0x80800801, 0x80010001,
53 0x80000001, 0x00000001, 0x00000000
56 typedef struct _OVRL_SRC_DEST {
57 /*clipped on-screen pixel position of overlay */
63 /*clipped pixel pos of source data within buffer thses need to be 128 bit word aligned */
69 /* on-screen pixel position of overlay */
76 static u32 ovlWidth, ovlHeight, ovlStride;
79 void ResetOverlayRegisters(volatile STG4000REG __iomem *pSTGReg)
83 /* Set Overlay address to default */
84 tmp = STG_READ_REG(DACOverlayAddr);
85 CLEAR_BITS_FRM_TO(0, 20);
87 STG_WRITE_REG(DACOverlayAddr, tmp);
89 /* Set Overlay U address */
90 tmp = STG_READ_REG(DACOverlayUAddr);
91 CLEAR_BITS_FRM_TO(0, 20);
92 STG_WRITE_REG(DACOverlayUAddr, tmp);
94 /* Set Overlay V address */
95 tmp = STG_READ_REG(DACOverlayVAddr);
96 CLEAR_BITS_FRM_TO(0, 20);
97 STG_WRITE_REG(DACOverlayVAddr, tmp);
99 /* Set Overlay Size */
100 tmp = STG_READ_REG(DACOverlaySize);
101 CLEAR_BITS_FRM_TO(0, 10);
102 CLEAR_BITS_FRM_TO(12, 31);
103 STG_WRITE_REG(DACOverlaySize, tmp);
105 /* Set Overlay Vt Decimation */
106 tmp = STG4000_NO_DECIMATION;
107 STG_WRITE_REG(DACOverlayVtDec, tmp);
109 /* Set Overlay format to default value */
110 tmp = STG_READ_REG(DACPixelFormat);
111 CLEAR_BITS_FRM_TO(4, 7);
112 CLEAR_BITS_FRM_TO(16, 22);
113 STG_WRITE_REG(DACPixelFormat, tmp);
115 /* Set Vertical scaling to default */
116 tmp = STG_READ_REG(DACVerticalScal);
117 CLEAR_BITS_FRM_TO(0, 11);
118 CLEAR_BITS_FRM_TO(16, 22);
119 tmp |= STG4000_NO_SCALING; /* Set to no scaling */
120 STG_WRITE_REG(DACVerticalScal, tmp);
122 /* Set Horizontal Scaling to default */
123 tmp = STG_READ_REG(DACHorizontalScal);
124 CLEAR_BITS_FRM_TO(0, 11);
125 CLEAR_BITS_FRM_TO(16, 17);
126 tmp |= STG4000_NO_SCALING; /* Set to no scaling */
127 STG_WRITE_REG(DACHorizontalScal, tmp);
129 /* Set Blend mode to Alpha Blend */
130 /* ????? SG 08/11/2001 Surely this isn't the alpha blend mode,
131 hopefully its overwrite
133 tmp = STG_READ_REG(DACBlendCtrl);
134 CLEAR_BITS_FRM_TO(0, 30);
135 tmp = (GRAPHICS_MODE << 28);
136 STG_WRITE_REG(DACBlendCtrl, tmp);
140 int CreateOverlaySurface(volatile STG4000REG __iomem *pSTGReg,
145 u32 * retStride, u32 * retUVStride)
150 if (inWidth > STG4000_OVRL_MAX_WIDTH ||
151 inHeight > STG4000_OVRL_MAX_HEIGHT) {
155 /* Stride in 16 byte words - 16Bpp */
157 /* Format is 16bits so num 16 byte words is width/8 */
158 if ((inWidth & 0x7) == 0) { /* inWidth % 8 */
159 ulStride = (inWidth / 8);
161 /* Round up to next 16byte boundary */
162 ulStride = ((inWidth + 8) / 8);
165 /* Y component is 8bits so num 16 byte words is width/16 */
166 if ((inWidth & 0xf) == 0) { /* inWidth % 16 */
167 ulStride = (inWidth / 16);
169 /* Round up to next 16byte boundary */
170 ulStride = ((inWidth + 16) / 16);
175 /* Set Overlay address and Format mode */
176 tmp = STG_READ_REG(DACOverlayAddr);
177 CLEAR_BITS_FRM_TO(0, 20);
179 CLEAR_BIT(31); /* Overlay format to Linear */
181 tmp |= SET_BIT(31); /* Overlay format to Planer */
184 /* Only bits 24:4 of the Overlay address */
185 tmp |= (ulOverlayOffset >> 4);
186 STG_WRITE_REG(DACOverlayAddr, tmp);
190 (inWidth & 0x1) ? (inWidth + 1 / 2) : (inWidth / 2);
193 /* Y component is 8bits so num 32 byte words is width/32 */
194 if ((uvSize & 0xf) == 0) { /* inWidth % 16 */
195 uvStride = (uvSize / 16);
197 /* Round up to next 32byte boundary */
198 uvStride = ((uvSize + 16) / 16);
201 ulOffset = ulOverlayOffset + (inHeight * (ulStride * 16));
202 /* Align U,V data to 32byte boundary */
203 if ((ulOffset & 0x1f) != 0)
204 ulOffset = (ulOffset + 32L) & 0xffffffE0L;
206 tmp = STG_READ_REG(DACOverlayUAddr);
207 CLEAR_BITS_FRM_TO(0, 20);
208 tmp |= (ulOffset >> 4);
209 STG_WRITE_REG(DACOverlayUAddr, tmp);
211 ulOffset += (inHeight / 2) * (uvStride * 16);
212 /* Align U,V data to 32byte boundary */
213 if ((ulOffset & 0x1f) != 0)
214 ulOffset = (ulOffset + 32L) & 0xffffffE0L;
216 tmp = STG_READ_REG(DACOverlayVAddr);
217 CLEAR_BITS_FRM_TO(0, 20);
218 tmp |= (ulOffset >> 4);
219 STG_WRITE_REG(DACOverlayVAddr, tmp);
221 *retUVStride = uvStride * 16;
225 /* Set Overlay YUV pixel format
226 * Make sure that LUT not used - ??????
228 tmp = STG_READ_REG(DACPixelFormat);
229 /* Only support Planer or UYVY linear formats */
230 CLEAR_BITS_FRM_TO(4, 9);
231 STG_WRITE_REG(DACPixelFormat, tmp);
234 ovlHeight = inHeight;
235 ovlStride = ulStride;
237 *retStride = ulStride << 4; /* In bytes */
242 int SetOverlayBlendMode(volatile STG4000REG __iomem *pSTGReg,
243 OVRL_BLEND_MODE mode,
244 u32 ulAlpha, u32 ulColorKey)
248 tmp = STG_READ_REG(DACBlendCtrl);
249 CLEAR_BITS_FRM_TO(28, 30);
254 CLEAR_BITS_FRM_TO(0, 23);
255 tmp |= (ulColorKey & 0x00FFFFFF);
259 CLEAR_BITS_FRM_TO(24, 27);
260 tmp |= ((ulAlpha & 0xF) << 24);
264 CLEAR_BITS_FRM_TO(0, 23);
265 tmp |= (ulColorKey & 0x00FFFFFF);
268 case CK_GLOBAL_ALPHA:
269 CLEAR_BITS_FRM_TO(0, 23);
270 tmp |= (ulColorKey & 0x00FFFFFF);
271 CLEAR_BITS_FRM_TO(24, 27);
272 tmp |= ((ulAlpha & 0xF) << 24);
276 case PER_PIXEL_ALPHA:
283 STG_WRITE_REG(DACBlendCtrl, tmp);
288 void EnableOverlayPlane(volatile STG4000REG __iomem *pSTGReg)
292 tmp = STG_READ_REG(DACPixelFormat);
294 STG_WRITE_REG(DACPixelFormat, tmp);
296 /* Set video stream control */
297 tmp = STG_READ_REG(DACStreamCtrl);
298 tmp |= SET_BIT(1); /* video stream */
299 STG_WRITE_REG(DACStreamCtrl, tmp);
302 static u32 Overlap(u32 ulBits, u32 ulPattern)
307 if (!(ulPattern & 1))
310 ulPattern = ulPattern >> 1;
317 int SetOverlayViewPort(volatile STG4000REG __iomem *pSTGReg,
319 u32 right, u32 bottom)
321 OVRL_SRC_DEST srcDest;
323 u32 ulSrcTop, ulSrcBottom;
325 u32 ulFxScale, ulFxOffset;
326 u32 ulHeight, ulWidth;
328 u32 ulDecimate, ulDecimated;
330 u32 ulDacXScale, ulDacYScale;
333 u32 ulSrcLeft, ulSrcRight;
334 u32 ulScaleLeft, ulScaleRight;
343 u32 ulExcessPixels, ulClip, ulExtraLines;
348 srcDest.ulSrcX2 = ovlWidth - 1;
349 srcDest.ulSrcY2 = ovlHeight - 1;
351 srcDest.ulDstX1 = left;
352 srcDest.ulDstY1 = top;
353 srcDest.ulDstX2 = right;
354 srcDest.ulDstY2 = bottom;
356 srcDest.lDstX1 = srcDest.ulDstX1;
357 srcDest.lDstY1 = srcDest.ulDstY1;
358 srcDest.lDstX2 = srcDest.ulDstX2;
359 srcDest.lDstY2 = srcDest.ulDstY2;
361 /************* Vertical decimation/scaling ******************/
363 /* Get Src Top and Bottom */
364 ulSrcTop = srcDest.ulSrcY1;
365 ulSrcBottom = srcDest.ulSrcY2;
367 ulSrc = ulSrcBottom - ulSrcTop;
368 ulDest = srcDest.lDstY2 - srcDest.lDstY1; /* on-screen overlay */
373 /* First work out the position we are to display as offset from the
374 * source of the buffer
376 ulFxScale = (ulDest << 11) / ulSrc; /* fixed point scale factor */
377 ulFxOffset = (srcDest.lDstY2 - srcDest.ulDstY2) << 11;
379 ulSrcBottom = ulSrcBottom - (ulFxOffset / ulFxScale);
380 ulSrc = ulSrcBottom - ulSrcTop;
383 ulDest = srcDest.ulDstY2 - (srcDest.ulDstY1 - 1);
384 ulPattern = adwDecim8[ulBits];
386 /* At this point ulSrc represents the input decimator */
387 if (ulSrc > ulDest) {
388 ulDecimate = ulSrc - ulDest;
390 ulApplied = ulSrc / 32;
392 while (((ulBits * ulApplied) +
393 Overlap((ulSrc % 32),
394 adwDecim8[ulBits])) < ulDecimate)
397 ulPattern = adwDecim8[ulBits];
399 (ulBits * ulApplied) + Overlap((ulSrc % 32),
401 ulSrc = ulSrc - ulDecimated; /* the number number of lines that will go into the scaler */
404 if (ulBits && (ulBits != 32)) {
405 ulVertDecFactor = (63 - ulBits) / (32 - ulBits); /* vertical decimation factor scaled up to nearest integer */
410 ulDacYScale = ((ulSrc - 1) * 2048) / (ulDest + 1);
412 tmp = STG_READ_REG(DACOverlayVtDec); /* Decimation */
413 CLEAR_BITS_FRM_TO(0, 31);
415 STG_WRITE_REG(DACOverlayVtDec, tmp);
417 /***************** Horizontal decimation/scaling ***************************/
420 * Now we handle the horizontal case, this is a simplified verison of
421 * the vertical case in that we decimate by factors of 2. as we are
422 * working in words we should always be able to decimate by these
423 * factors. as we always have to have a buffer which is aligned to a
424 * whole number of 128 bit words, we must align the left side to the
425 * lowest to the next lowest 128 bit boundary, and the right hand edge
426 * to the next largets boundary, (in a similar way to how we didi it in
427 * PMX1) as the left and right hand edges are aligned to these
428 * boundaries normally this only becomes an issue when we are chopping
429 * of one of the sides We shall work out vertical stuff first
431 ulSrc = srcDest.ulSrcX2 - srcDest.ulSrcX1;
432 ulDest = srcDest.lDstX2 - srcDest.lDstX1;
434 ulLeft = srcDest.ulDstX1;
435 ulRight = srcDest.ulDstX2;
437 if (srcDest.ulDstX1 > 2) {
438 ulLeft = srcDest.ulDstX1 + 2;
439 ulRight = srcDest.ulDstX2 + 1;
441 ulLeft = srcDest.ulDstX1;
442 ulRight = srcDest.ulDstX2 + 1;
445 /* first work out the position we are to display as offset from the source of the buffer */
452 /* source pixels per dest pixel <<11 */
453 ulFxScale = ((ulSrc - 1) << 11) / (ulDest);
455 /* then number of destination pixels out we are */
456 ulFxOffset = ulFxScale * ((srcDest.ulDstX1 - srcDest.lDstX1) + ulClipOff);
459 /* this replaces the code which was making a decision as to use either ulFxOffset or ulSrcX1 */
460 ulSrcLeft = srcDest.ulSrcX1 + ulFxOffset;
462 /* then number of destination pixels out we are */
463 ulFxOffset = ulFxScale * (srcDest.lDstX2 - srcDest.ulDstX2);
466 ulSrcRight = srcDest.ulSrcX2 - ulFxOffset;
469 * we must align these to our 128 bit boundaries. we shall
470 * round down the pixel pos to the nearest 8 pixels.
472 ulScaleLeft = ulSrcLeft;
473 ulScaleRight = ulSrcRight;
475 /* shift fxscale until it is in the range of the scaler */
477 ulScale = (((ulSrcRight - ulSrcLeft) - 1) << (11 - ulhDecim)) / (ulRight - ulLeft + 2);
479 while (ulScale > 0x800) {
481 ulScale = (((ulSrcRight - ulSrcLeft) - 1) << (11 - ulhDecim)) / (ulRight - ulLeft + 2);
485 * to try and get the best values We first try and use
486 * src/dwdest for the scale factor, then we move onto src-1
488 * we want to check to see if we will need to clip data, if so
489 * then we should clip our source so that we don't need to
495 * we must align the right hand edge to the next 32
496 * pixel` boundary, must be on a 256 boundary so u, and
497 * v are 128 bit aligned
499 ulSrcRight = (ulSrcRight + 0x1f) & ~0x1f;
504 * we must align the right hand edge to the next
507 ulSrcRight = (ulSrcRight + 0x7) & ~0x7;
510 /* this is the input size line store needs to cope with */
511 ulWidth = ulSrcRight - ulSrcLeft;
514 * use unclipped value to work out scale factror this is the
515 * scale factor we want we shall now work out the horizonal
516 * decimation and scaling
518 ulsVal = ((ulWidth / 8) >> ulhDecim);
520 if ((ulWidth != (ulsVal << ulhDecim) * 8))
523 /* input pixels to scaler; */
524 ulSrc = ulWidth >> ulhDecim;
529 ulExcessPixels = ((((ulScaleLeft - ulSrcLeft)) << (11 - ulhDecim)) / ulScale);
531 ulClip = (ulSrc << 11) / ulScale;
532 ulClip -= (ulRight - ulLeft);
533 ulClip += ulExcessPixels;
538 /* We may need to do more here if we really have a HW rev < 5 */
541 ulExtraLines = (1 << ulhDecim) * ulVertDecFactor;
543 ulHeight += ulExtraLines;
545 ulDacXScale = ulScale;
548 tmp = STG_READ_REG(DACVerticalScal);
549 CLEAR_BITS_FRM_TO(0, 11);
550 CLEAR_BITS_FRM_TO(16, 22); /* Vertical Scaling */
552 /* Calculate new output line stride, this is always the number of 422
553 words in the line buffer, so it doesn't matter if the
554 mode is 420. Then set the vertical scale register.
556 ulStride = (ulWidth >> (ulhDecim + 3)) + ulsAdd;
557 tmp |= ((ulStride << 16) | (ulDacYScale)); /* DAC_LS_CTRL = stride */
558 STG_WRITE_REG(DACVerticalScal, tmp);
560 /* Now set up the overlay size using the modified width and height
561 from decimate and scaling calculations
563 tmp = STG_READ_REG(DACOverlaySize);
564 CLEAR_BITS_FRM_TO(0, 10);
565 CLEAR_BITS_FRM_TO(12, 31);
569 (ovlStride | ((ulHeight + 1) << 12) |
570 (((ulWidth / 8) - 1) << 23));
573 (ovlStride | ((ulHeight + 1) << 12) |
574 (((ulWidth / 32) - 1) << 23));
577 STG_WRITE_REG(DACOverlaySize, tmp);
579 /* Set Video Window Start */
580 tmp = ((ulLeft << 16)) | (srcDest.ulDstY1);
581 STG_WRITE_REG(DACVidWinStart, tmp);
583 /* Set Video Window End */
584 tmp = ((ulRight) << 16) | (srcDest.ulDstY2);
585 STG_WRITE_REG(DACVidWinEnd, tmp);
587 /* Finally set up the rest of the overlay regs in the order
588 done in the IMG driver
590 tmp = STG_READ_REG(DACPixelFormat);
591 tmp = ((ulExcessPixels << 16) | tmp) & 0x7fffffff;
592 STG_WRITE_REG(DACPixelFormat, tmp);
594 tmp = STG_READ_REG(DACHorizontalScal);
595 CLEAR_BITS_FRM_TO(0, 11);
596 CLEAR_BITS_FRM_TO(16, 17);
597 tmp |= ((ulhDecim << 16) | (ulDacXScale));
598 STG_WRITE_REG(DACHorizontalScal, tmp);