linux/drivers/media/common/saa7146/saa7146_hlp.c
<<
>>
Prefs
   1#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
   2
   3#include <linux/kernel.h>
   4#include <linux/export.h>
   5#include <media/drv-intf/saa7146_vv.h>
   6
   7static void calculate_output_format_register(struct saa7146_dev* saa, u32 palette, u32* clip_format)
   8{
   9        /* clear out the necessary bits */
  10        *clip_format &= 0x0000ffff;
  11        /* set these bits new */
  12        *clip_format |=  (( ((palette&0xf00)>>8) << 30) | ((palette&0x00f) << 24) | (((palette&0x0f0)>>4) << 16));
  13}
  14
  15static void calculate_hps_source_and_sync(struct saa7146_dev *dev, int source, int sync, u32* hps_ctrl)
  16{
  17        *hps_ctrl &= ~(MASK_30 | MASK_31 | MASK_28);
  18        *hps_ctrl |= (source << 30) | (sync << 28);
  19}
  20
  21static void calculate_hxo_and_hyo(struct saa7146_vv *vv, u32* hps_h_scale, u32* hps_ctrl)
  22{
  23        int hyo = 0, hxo = 0;
  24
  25        hyo = vv->standard->v_offset;
  26        hxo = vv->standard->h_offset;
  27
  28        *hps_h_scale    &= ~(MASK_B0 | 0xf00);
  29        *hps_h_scale    |= (hxo <<  0);
  30
  31        *hps_ctrl       &= ~(MASK_W0 | MASK_B2);
  32        *hps_ctrl       |= (hyo << 12);
  33}
  34
  35/* helper functions for the calculation of the horizontal- and vertical
  36   scaling registers, clip-format-register etc ...
  37   these functions take pointers to the (most-likely read-out
  38   original-values) and manipulate them according to the requested
  39   changes.
  40*/
  41
  42/* hps_coeff used for CXY and CXUV; scale 1/1 -> scale 1/64 */
  43static struct {
  44        u16 hps_coeff;
  45        u16 weight_sum;
  46} hps_h_coeff_tab [] = {
  47        {0x00,   2}, {0x02,   4}, {0x00,   4}, {0x06,   8}, {0x02,   8},
  48        {0x08,   8}, {0x00,   8}, {0x1E,  16}, {0x0E,   8}, {0x26,   8},
  49        {0x06,   8}, {0x42,   8}, {0x02,   8}, {0x80,   8}, {0x00,   8},
  50        {0xFE,  16}, {0xFE,   8}, {0x7E,   8}, {0x7E,   8}, {0x3E,   8},
  51        {0x3E,   8}, {0x1E,   8}, {0x1E,   8}, {0x0E,   8}, {0x0E,   8},
  52        {0x06,   8}, {0x06,   8}, {0x02,   8}, {0x02,   8}, {0x00,   8},
  53        {0x00,   8}, {0xFE,  16}, {0xFE,   8}, {0xFE,   8}, {0xFE,   8},
  54        {0xFE,   8}, {0xFE,   8}, {0xFE,   8}, {0xFE,   8}, {0xFE,   8},
  55        {0xFE,   8}, {0xFE,   8}, {0xFE,   8}, {0xFE,   8}, {0xFE,   8},
  56        {0xFE,   8}, {0xFE,   8}, {0xFE,   8}, {0xFE,   8}, {0x7E,   8},
  57        {0x7E,   8}, {0x3E,   8}, {0x3E,   8}, {0x1E,   8}, {0x1E,   8},
  58        {0x0E,   8}, {0x0E,   8}, {0x06,   8}, {0x06,   8}, {0x02,   8},
  59        {0x02,   8}, {0x00,   8}, {0x00,   8}, {0xFE,  16}
  60};
  61
  62/* table of attenuation values for horizontal scaling */
  63static u8 h_attenuation[] = { 1, 2, 4, 8, 2, 4, 8, 16, 0};
  64
  65/* calculate horizontal scale registers */
  66static int calculate_h_scale_registers(struct saa7146_dev *dev,
  67        int in_x, int out_x, int flip_lr,
  68        u32* hps_ctrl, u32* hps_v_gain, u32* hps_h_prescale, u32* hps_h_scale)
  69{
  70        /* horizontal prescaler */
  71        u32 dcgx = 0, xpsc = 0, xacm = 0, cxy = 0, cxuv = 0;
  72        /* horizontal scaler */
  73        u32 xim = 0, xp = 0, xsci =0;
  74        /* vertical scale & gain */
  75        u32 pfuv = 0;
  76
  77        /* helper variables */
  78        u32 h_atten = 0, i = 0;
  79
  80        if ( 0 == out_x ) {
  81                return -EINVAL;
  82        }
  83
  84        /* mask out vanity-bit */
  85        *hps_ctrl &= ~MASK_29;
  86
  87        /* calculate prescale-(xspc)-value:     [n   .. 1/2) : 1
  88                                                [1/2 .. 1/3) : 2
  89                                                [1/3 .. 1/4) : 3
  90                                                ...             */
  91        if (in_x > out_x) {
  92                xpsc = in_x / out_x;
  93        }
  94        else {
  95                /* zooming */
  96                xpsc = 1;
  97        }
  98
  99        /* if flip_lr-bit is set, number of pixels after
 100           horizontal prescaling must be < 384 */
 101        if ( 0 != flip_lr ) {
 102
 103                /* set vanity bit */
 104                *hps_ctrl |= MASK_29;
 105
 106                while (in_x / xpsc >= 384 )
 107                        xpsc++;
 108        }
 109        /* if zooming is wanted, number of pixels after
 110           horizontal prescaling must be < 768 */
 111        else {
 112                while ( in_x / xpsc >= 768 )
 113                        xpsc++;
 114        }
 115
 116        /* maximum prescale is 64 (p.69) */
 117        if ( xpsc > 64 )
 118                xpsc = 64;
 119
 120        /* keep xacm clear*/
 121        xacm = 0;
 122
 123        /* set horizontal filter parameters (CXY = CXUV) */
 124        cxy = hps_h_coeff_tab[( (xpsc - 1) < 63 ? (xpsc - 1) : 63 )].hps_coeff;
 125        cxuv = cxy;
 126
 127        /* calculate and set horizontal fine scale (xsci) */
 128
 129        /* bypass the horizontal scaler ? */
 130        if ( (in_x == out_x) && ( 1 == xpsc ) )
 131                xsci = 0x400;
 132        else
 133                xsci = ( (1024 * in_x) / (out_x * xpsc) ) + xpsc;
 134
 135        /* set start phase for horizontal fine scale (xp) to 0 */
 136        xp = 0;
 137
 138        /* set xim, if we bypass the horizontal scaler */
 139        if ( 0x400 == xsci )
 140                xim = 1;
 141        else
 142                xim = 0;
 143
 144        /* if the prescaler is bypassed, enable horizontal
 145           accumulation mode (xacm) and clear dcgx */
 146        if( 1 == xpsc ) {
 147                xacm = 1;
 148                dcgx = 0;
 149        } else {
 150                xacm = 0;
 151                /* get best match in the table of attenuations
 152                   for horizontal scaling */
 153                h_atten = hps_h_coeff_tab[( (xpsc - 1) < 63 ? (xpsc - 1) : 63 )].weight_sum;
 154
 155                for (i = 0; h_attenuation[i] != 0; i++) {
 156                        if (h_attenuation[i] >= h_atten)
 157                                break;
 158                }
 159
 160                dcgx = i;
 161        }
 162
 163        /* the horizontal scaling increment controls the UV filter
 164           to reduce the bandwidth to improve the display quality,
 165           so set it ... */
 166        if ( xsci == 0x400)
 167                pfuv = 0x00;
 168        else if ( xsci < 0x600)
 169                pfuv = 0x01;
 170        else if ( xsci < 0x680)
 171                pfuv = 0x11;
 172        else if ( xsci < 0x700)
 173                pfuv = 0x22;
 174        else
 175                pfuv = 0x33;
 176
 177
 178        *hps_v_gain  &= MASK_W0|MASK_B2;
 179        *hps_v_gain  |= (pfuv << 24);
 180
 181        *hps_h_scale    &= ~(MASK_W1 | 0xf000);
 182        *hps_h_scale    |= (xim << 31) | (xp << 24) | (xsci << 12);
 183
 184        *hps_h_prescale |= (dcgx << 27) | ((xpsc-1) << 18) | (xacm << 17) | (cxy << 8) | (cxuv << 0);
 185
 186        return 0;
 187}
 188
 189static struct {
 190        u16 hps_coeff;
 191        u16 weight_sum;
 192} hps_v_coeff_tab [] = {
 193 {0x0100,   2},  {0x0102,   4},  {0x0300,   4},  {0x0106,   8},  {0x0502,   8},
 194 {0x0708,   8},  {0x0F00,   8},  {0x011E,  16},  {0x110E,  16},  {0x1926,  16},
 195 {0x3906,  16},  {0x3D42,  16},  {0x7D02,  16},  {0x7F80,  16},  {0xFF00,  16},
 196 {0x01FE,  32},  {0x01FE,  32},  {0x817E,  32},  {0x817E,  32},  {0xC13E,  32},
 197 {0xC13E,  32},  {0xE11E,  32},  {0xE11E,  32},  {0xF10E,  32},  {0xF10E,  32},
 198 {0xF906,  32},  {0xF906,  32},  {0xFD02,  32},  {0xFD02,  32},  {0xFF00,  32},
 199 {0xFF00,  32},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},
 200 {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},
 201 {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},
 202 {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x01FE,  64},  {0x817E,  64},
 203 {0x817E,  64},  {0xC13E,  64},  {0xC13E,  64},  {0xE11E,  64},  {0xE11E,  64},
 204 {0xF10E,  64},  {0xF10E,  64},  {0xF906,  64},  {0xF906,  64},  {0xFD02,  64},
 205 {0xFD02,  64},  {0xFF00,  64},  {0xFF00,  64},  {0x01FE, 128}
 206};
 207
 208/* table of attenuation values for vertical scaling */
 209static u16 v_attenuation[] = { 2, 4, 8, 16, 32, 64, 128, 256, 0};
 210
 211/* calculate vertical scale registers */
 212static int calculate_v_scale_registers(struct saa7146_dev *dev, enum v4l2_field field,
 213        int in_y, int out_y, u32* hps_v_scale, u32* hps_v_gain)
 214{
 215        int lpi = 0;
 216
 217        /* vertical scaling */
 218        u32 yacm = 0, ysci = 0, yacl = 0, ypo = 0, ype = 0;
 219        /* vertical scale & gain */
 220        u32 dcgy = 0, cya_cyb = 0;
 221
 222        /* helper variables */
 223        u32 v_atten = 0, i = 0;
 224
 225        /* error, if vertical zooming */
 226        if ( in_y < out_y ) {
 227                return -EINVAL;
 228        }
 229
 230        /* linear phase interpolation may be used
 231           if scaling is between 1 and 1/2 (both fields used)
 232           or scaling is between 1/2 and 1/4 (if only one field is used) */
 233
 234        if (V4L2_FIELD_HAS_BOTH(field)) {
 235                if( 2*out_y >= in_y) {
 236                        lpi = 1;
 237                }
 238        } else if (field == V4L2_FIELD_TOP
 239                || field == V4L2_FIELD_ALTERNATE
 240                || field == V4L2_FIELD_BOTTOM) {
 241                if( 4*out_y >= in_y ) {
 242                        lpi = 1;
 243                }
 244                out_y *= 2;
 245        }
 246        if( 0 != lpi ) {
 247
 248                yacm = 0;
 249                yacl = 0;
 250                cya_cyb = 0x00ff;
 251
 252                /* calculate scaling increment */
 253                if ( in_y > out_y )
 254                        ysci = ((1024 * in_y) / (out_y + 1)) - 1024;
 255                else
 256                        ysci = 0;
 257
 258                dcgy = 0;
 259
 260                /* calculate ype and ypo */
 261                ype = ysci / 16;
 262                ypo = ype + (ysci / 64);
 263
 264        } else {
 265                yacm = 1;
 266
 267                /* calculate scaling increment */
 268                ysci = (((10 * 1024 * (in_y - out_y - 1)) / in_y) + 9) / 10;
 269
 270                /* calculate ype and ypo */
 271                ypo = ype = ((ysci + 15) / 16);
 272
 273                /* the sequence length interval (yacl) has to be set according
 274                   to the prescale value, e.g.  [n   .. 1/2) : 0
 275                                                [1/2 .. 1/3) : 1
 276                                                [1/3 .. 1/4) : 2
 277                                                ... */
 278                if ( ysci < 512) {
 279                        yacl = 0;
 280                } else {
 281                        yacl = ( ysci / (1024 - ysci) );
 282                }
 283
 284                /* get filter coefficients for cya, cyb from table hps_v_coeff_tab */
 285                cya_cyb = hps_v_coeff_tab[ (yacl < 63 ? yacl : 63 ) ].hps_coeff;
 286
 287                /* get best match in the table of attenuations for vertical scaling */
 288                v_atten = hps_v_coeff_tab[ (yacl < 63 ? yacl : 63 ) ].weight_sum;
 289
 290                for (i = 0; v_attenuation[i] != 0; i++) {
 291                        if (v_attenuation[i] >= v_atten)
 292                                break;
 293                }
 294
 295                dcgy = i;
 296        }
 297
 298        /* ypo and ype swapped in spec ? */
 299        *hps_v_scale    |= (yacm << 31) | (ysci << 21) | (yacl << 15) | (ypo << 8 ) | (ype << 1);
 300
 301        *hps_v_gain     &= ~(MASK_W0|MASK_B2);
 302        *hps_v_gain     |= (dcgy << 16) | (cya_cyb << 0);
 303
 304        return 0;
 305}
 306
 307/* simple bubble-sort algorithm with duplicate elimination */
 308static int sort_and_eliminate(u32* values, int* count)
 309{
 310        int low = 0, high = 0, top = 0;
 311        int cur = 0, next = 0;
 312
 313        /* sanity checks */
 314        if( (0 > *count) || (NULL == values) ) {
 315                return -EINVAL;
 316        }
 317
 318        /* bubble sort the first @count items of the array @values */
 319        for( top = *count; top > 0; top--) {
 320                for( low = 0, high = 1; high < top; low++, high++) {
 321                        if( values[low] > values[high] )
 322                                swap(values[low], values[high]);
 323                }
 324        }
 325
 326        /* remove duplicate items */
 327        for( cur = 0, next = 1; next < *count; next++) {
 328                if( values[cur] != values[next])
 329                        values[++cur] = values[next];
 330        }
 331
 332        *count = cur + 1;
 333
 334        return 0;
 335}
 336
 337static void calculate_clipping_registers_rect(struct saa7146_dev *dev, struct saa7146_fh *fh,
 338        struct saa7146_video_dma *vdma2, u32* clip_format, u32* arbtr_ctrl, enum v4l2_field field)
 339{
 340        struct saa7146_vv *vv = dev->vv_data;
 341        __le32 *clipping = vv->d_clipping.cpu_addr;
 342
 343        int width = vv->ov.win.w.width;
 344        int height =  vv->ov.win.w.height;
 345        int clipcount = vv->ov.nclips;
 346
 347        u32 line_list[32];
 348        u32 pixel_list[32];
 349        int numdwords = 0;
 350
 351        int i = 0, j = 0;
 352        int cnt_line = 0, cnt_pixel = 0;
 353
 354        int x[32], y[32], w[32], h[32];
 355
 356        /* clear out memory */
 357        memset(&line_list[0],  0x00, sizeof(u32)*32);
 358        memset(&pixel_list[0], 0x00, sizeof(u32)*32);
 359        memset(clipping,  0x00, SAA7146_CLIPPING_MEM);
 360
 361        /* fill the line and pixel-lists */
 362        for(i = 0; i < clipcount; i++) {
 363                int l = 0, r = 0, t = 0, b = 0;
 364
 365                x[i] = vv->ov.clips[i].c.left;
 366                y[i] = vv->ov.clips[i].c.top;
 367                w[i] = vv->ov.clips[i].c.width;
 368                h[i] = vv->ov.clips[i].c.height;
 369
 370                if( w[i] < 0) {
 371                        x[i] += w[i]; w[i] = -w[i];
 372                }
 373                if( h[i] < 0) {
 374                        y[i] += h[i]; h[i] = -h[i];
 375                }
 376                if( x[i] < 0) {
 377                        w[i] += x[i]; x[i] = 0;
 378                }
 379                if( y[i] < 0) {
 380                        h[i] += y[i]; y[i] = 0;
 381                }
 382                if( 0 != vv->vflip ) {
 383                        y[i] = height - y[i] - h[i];
 384                }
 385
 386                l = x[i];
 387                r = x[i]+w[i];
 388                t = y[i];
 389                b = y[i]+h[i];
 390
 391                /* insert left/right coordinates */
 392                pixel_list[ 2*i   ] = min_t(int, l, width);
 393                pixel_list[(2*i)+1] = min_t(int, r, width);
 394                /* insert top/bottom coordinates */
 395                line_list[ 2*i   ] = min_t(int, t, height);
 396                line_list[(2*i)+1] = min_t(int, b, height);
 397        }
 398
 399        /* sort and eliminate lists */
 400        cnt_line = cnt_pixel = 2*clipcount;
 401        sort_and_eliminate( &pixel_list[0], &cnt_pixel );
 402        sort_and_eliminate( &line_list[0], &cnt_line );
 403
 404        /* calculate the number of used u32s */
 405        numdwords = max_t(int, (cnt_line+1), (cnt_pixel+1))*2;
 406        numdwords = max_t(int, 4, numdwords);
 407        numdwords = min_t(int, 64, numdwords);
 408
 409        /* fill up cliptable */
 410        for(i = 0; i < cnt_pixel; i++) {
 411                clipping[2*i] |= cpu_to_le32(pixel_list[i] << 16);
 412        }
 413        for(i = 0; i < cnt_line; i++) {
 414                clipping[(2*i)+1] |= cpu_to_le32(line_list[i] << 16);
 415        }
 416
 417        /* fill up cliptable with the display infos */
 418        for(j = 0; j < clipcount; j++) {
 419
 420                for(i = 0; i < cnt_pixel; i++) {
 421
 422                        if( x[j] < 0)
 423                                x[j] = 0;
 424
 425                        if( pixel_list[i] < (x[j] + w[j])) {
 426
 427                                if ( pixel_list[i] >= x[j] ) {
 428                                        clipping[2*i] |= cpu_to_le32(1 << j);
 429                                }
 430                        }
 431                }
 432                for(i = 0; i < cnt_line; i++) {
 433
 434                        if( y[j] < 0)
 435                                y[j] = 0;
 436
 437                        if( line_list[i] < (y[j] + h[j]) ) {
 438
 439                                if( line_list[i] >= y[j] ) {
 440                                        clipping[(2*i)+1] |= cpu_to_le32(1 << j);
 441                                }
 442                        }
 443                }
 444        }
 445
 446        /* adjust arbitration control register */
 447        *arbtr_ctrl &= 0xffff00ff;
 448        *arbtr_ctrl |= 0x00001c00;
 449
 450        vdma2->base_even        = vv->d_clipping.dma_handle;
 451        vdma2->base_odd         = vv->d_clipping.dma_handle;
 452        vdma2->prot_addr        = vv->d_clipping.dma_handle+((sizeof(u32))*(numdwords));
 453        vdma2->base_page        = 0x04;
 454        vdma2->pitch            = 0x00;
 455        vdma2->num_line_byte    = (0 << 16 | (sizeof(u32))*(numdwords-1) );
 456
 457        /* set clipping-mode. this depends on the field(s) used */
 458        *clip_format &= 0xfffffff7;
 459        if (V4L2_FIELD_HAS_BOTH(field)) {
 460                *clip_format |= 0x00000008;
 461        } else {
 462                *clip_format |= 0x00000000;
 463        }
 464}
 465
 466/* disable clipping */
 467static void saa7146_disable_clipping(struct saa7146_dev *dev)
 468{
 469        u32 clip_format = saa7146_read(dev, CLIP_FORMAT_CTRL);
 470
 471        /* mask out relevant bits (=lower word)*/
 472        clip_format &= MASK_W1;
 473
 474        /* upload clipping-registers*/
 475        saa7146_write(dev, CLIP_FORMAT_CTRL,clip_format);
 476        saa7146_write(dev, MC2, (MASK_05 | MASK_21));
 477
 478        /* disable video dma2 */
 479        saa7146_write(dev, MC1, MASK_21);
 480}
 481
 482static void saa7146_set_clipping_rect(struct saa7146_fh *fh)
 483{
 484        struct saa7146_dev *dev = fh->dev;
 485        struct saa7146_vv *vv = dev->vv_data;
 486        enum v4l2_field field = vv->ov.win.field;
 487        struct  saa7146_video_dma vdma2;
 488        u32 clip_format;
 489        u32 arbtr_ctrl;
 490
 491        /* check clipcount, disable clipping if clipcount == 0*/
 492        if (vv->ov.nclips == 0) {
 493                saa7146_disable_clipping(dev);
 494                return;
 495        }
 496
 497        clip_format = saa7146_read(dev, CLIP_FORMAT_CTRL);
 498        arbtr_ctrl = saa7146_read(dev, PCI_BT_V1);
 499
 500        calculate_clipping_registers_rect(dev, fh, &vdma2, &clip_format, &arbtr_ctrl, field);
 501
 502        /* set clipping format */
 503        clip_format &= 0xffff0008;
 504        clip_format |= (SAA7146_CLIPPING_RECT << 4);
 505
 506        /* prepare video dma2 */
 507        saa7146_write(dev, BASE_EVEN2,          vdma2.base_even);
 508        saa7146_write(dev, BASE_ODD2,           vdma2.base_odd);
 509        saa7146_write(dev, PROT_ADDR2,          vdma2.prot_addr);
 510        saa7146_write(dev, BASE_PAGE2,          vdma2.base_page);
 511        saa7146_write(dev, PITCH2,              vdma2.pitch);
 512        saa7146_write(dev, NUM_LINE_BYTE2,      vdma2.num_line_byte);
 513
 514        /* prepare the rest */
 515        saa7146_write(dev, CLIP_FORMAT_CTRL,clip_format);
 516        saa7146_write(dev, PCI_BT_V1, arbtr_ctrl);
 517
 518        /* upload clip_control-register, clipping-registers, enable video dma2 */
 519        saa7146_write(dev, MC2, (MASK_05 | MASK_21 | MASK_03 | MASK_19));
 520        saa7146_write(dev, MC1, (MASK_05 | MASK_21));
 521}
 522
 523static void saa7146_set_window(struct saa7146_dev *dev, int width, int height, enum v4l2_field field)
 524{
 525        struct saa7146_vv *vv = dev->vv_data;
 526
 527        int source = vv->current_hps_source;
 528        int sync = vv->current_hps_sync;
 529
 530        u32 hps_v_scale = 0, hps_v_gain  = 0, hps_ctrl = 0, hps_h_prescale = 0, hps_h_scale = 0;
 531
 532        /* set vertical scale */
 533        hps_v_scale = 0; /* all bits get set by the function-call */
 534        hps_v_gain  = 0; /* fixme: saa7146_read(dev, HPS_V_GAIN);*/
 535        calculate_v_scale_registers(dev, field, vv->standard->v_field*2, height, &hps_v_scale, &hps_v_gain);
 536
 537        /* set horizontal scale */
 538        hps_ctrl        = 0;
 539        hps_h_prescale  = 0; /* all bits get set in the function */
 540        hps_h_scale     = 0;
 541        calculate_h_scale_registers(dev, vv->standard->h_pixels, width, vv->hflip, &hps_ctrl, &hps_v_gain, &hps_h_prescale, &hps_h_scale);
 542
 543        /* set hyo and hxo */
 544        calculate_hxo_and_hyo(vv, &hps_h_scale, &hps_ctrl);
 545        calculate_hps_source_and_sync(dev, source, sync, &hps_ctrl);
 546
 547        /* write out new register contents */
 548        saa7146_write(dev, HPS_V_SCALE, hps_v_scale);
 549        saa7146_write(dev, HPS_V_GAIN,  hps_v_gain);
 550        saa7146_write(dev, HPS_CTRL,    hps_ctrl);
 551        saa7146_write(dev, HPS_H_PRESCALE,hps_h_prescale);
 552        saa7146_write(dev, HPS_H_SCALE, hps_h_scale);
 553
 554        /* upload shadow-ram registers */
 555        saa7146_write(dev, MC2, (MASK_05 | MASK_06 | MASK_21 | MASK_22) );
 556}
 557
 558/* calculate the new memory offsets for a desired position */
 559static void saa7146_set_position(struct saa7146_dev *dev, int w_x, int w_y, int w_height, enum v4l2_field field, u32 pixelformat)
 560{
 561        struct saa7146_vv *vv = dev->vv_data;
 562        struct saa7146_format *sfmt = saa7146_format_by_fourcc(dev, pixelformat);
 563
 564        int b_depth = vv->ov_fmt->depth;
 565        int b_bpl = vv->ov_fb.fmt.bytesperline;
 566        /* The unsigned long cast is to remove a 64-bit compile warning since
 567           it looks like a 64-bit address is cast to a 32-bit value, even
 568           though the base pointer is really a 32-bit physical address that
 569           goes into a 32-bit DMA register.
 570           FIXME: might not work on some 64-bit platforms, but see the FIXME
 571           in struct v4l2_framebuffer (videodev2.h) for that.
 572         */
 573        u32 base = (u32)(unsigned long)vv->ov_fb.base;
 574
 575        struct  saa7146_video_dma vdma1;
 576
 577        /* calculate memory offsets for picture, look if we shall top-down-flip */
 578        vdma1.pitch     = 2*b_bpl;
 579        if ( 0 == vv->vflip ) {
 580                vdma1.base_even = base + (w_y * (vdma1.pitch/2)) + (w_x * (b_depth / 8));
 581                vdma1.base_odd  = vdma1.base_even + (vdma1.pitch / 2);
 582                vdma1.prot_addr = vdma1.base_even + (w_height * (vdma1.pitch / 2));
 583        }
 584        else {
 585                vdma1.base_even = base + ((w_y+w_height) * (vdma1.pitch/2)) + (w_x * (b_depth / 8));
 586                vdma1.base_odd  = vdma1.base_even - (vdma1.pitch / 2);
 587                vdma1.prot_addr = vdma1.base_odd - (w_height * (vdma1.pitch / 2));
 588        }
 589
 590        if (V4L2_FIELD_HAS_BOTH(field)) {
 591        } else if (field == V4L2_FIELD_ALTERNATE) {
 592                /* fixme */
 593                vdma1.base_odd = vdma1.prot_addr;
 594                vdma1.pitch /= 2;
 595        } else if (field == V4L2_FIELD_TOP) {
 596                vdma1.base_odd = vdma1.prot_addr;
 597                vdma1.pitch /= 2;
 598        } else if (field == V4L2_FIELD_BOTTOM) {
 599                vdma1.base_odd = vdma1.base_even;
 600                vdma1.base_even = vdma1.prot_addr;
 601                vdma1.pitch /= 2;
 602        }
 603
 604        if ( 0 != vv->vflip ) {
 605                vdma1.pitch *= -1;
 606        }
 607
 608        vdma1.base_page = sfmt->swap;
 609        vdma1.num_line_byte = (vv->standard->v_field<<16)+vv->standard->h_pixels;
 610
 611        saa7146_write_out_dma(dev, 1, &vdma1);
 612}
 613
 614static void saa7146_set_output_format(struct saa7146_dev *dev, unsigned long palette)
 615{
 616        u32 clip_format = saa7146_read(dev, CLIP_FORMAT_CTRL);
 617
 618        /* call helper function */
 619        calculate_output_format_register(dev,palette,&clip_format);
 620
 621        /* update the hps registers */
 622        saa7146_write(dev, CLIP_FORMAT_CTRL, clip_format);
 623        saa7146_write(dev, MC2, (MASK_05 | MASK_21));
 624}
 625
 626/* select input-source */
 627void saa7146_set_hps_source_and_sync(struct saa7146_dev *dev, int source, int sync)
 628{
 629        struct saa7146_vv *vv = dev->vv_data;
 630        u32 hps_ctrl = 0;
 631
 632        /* read old state */
 633        hps_ctrl = saa7146_read(dev, HPS_CTRL);
 634
 635        hps_ctrl &= ~( MASK_31 | MASK_30 | MASK_28 );
 636        hps_ctrl |= (source << 30) | (sync << 28);
 637
 638        /* write back & upload register */
 639        saa7146_write(dev, HPS_CTRL, hps_ctrl);
 640        saa7146_write(dev, MC2, (MASK_05 | MASK_21));
 641
 642        vv->current_hps_source = source;
 643        vv->current_hps_sync = sync;
 644}
 645EXPORT_SYMBOL_GPL(saa7146_set_hps_source_and_sync);
 646
 647int saa7146_enable_overlay(struct saa7146_fh *fh)
 648{
 649        struct saa7146_dev *dev = fh->dev;
 650        struct saa7146_vv *vv = dev->vv_data;
 651
 652        saa7146_set_window(dev, vv->ov.win.w.width, vv->ov.win.w.height, vv->ov.win.field);
 653        saa7146_set_position(dev, vv->ov.win.w.left, vv->ov.win.w.top, vv->ov.win.w.height, vv->ov.win.field, vv->ov_fmt->pixelformat);
 654        saa7146_set_output_format(dev, vv->ov_fmt->trans);
 655        saa7146_set_clipping_rect(fh);
 656
 657        /* enable video dma1 */
 658        saa7146_write(dev, MC1, (MASK_06 | MASK_22));
 659        return 0;
 660}
 661
 662void saa7146_disable_overlay(struct saa7146_fh *fh)
 663{
 664        struct saa7146_dev *dev = fh->dev;
 665
 666        /* disable clipping + video dma1 */
 667        saa7146_disable_clipping(dev);
 668        saa7146_write(dev, MC1, MASK_22);
 669}
 670
 671void saa7146_write_out_dma(struct saa7146_dev* dev, int which, struct saa7146_video_dma* vdma)
 672{
 673        int where = 0;
 674
 675        if( which < 1 || which > 3) {
 676                return;
 677        }
 678
 679        /* calculate starting address */
 680        where  = (which-1)*0x18;
 681
 682        saa7146_write(dev, where,       vdma->base_odd);
 683        saa7146_write(dev, where+0x04,  vdma->base_even);
 684        saa7146_write(dev, where+0x08,  vdma->prot_addr);
 685        saa7146_write(dev, where+0x0c,  vdma->pitch);
 686        saa7146_write(dev, where+0x10,  vdma->base_page);
 687        saa7146_write(dev, where+0x14,  vdma->num_line_byte);
 688
 689        /* upload */
 690        saa7146_write(dev, MC2, (MASK_02<<(which-1))|(MASK_18<<(which-1)));
 691/*
 692        printk("vdma%d.base_even:     0x%08x\n", which,vdma->base_even);
 693        printk("vdma%d.base_odd:      0x%08x\n", which,vdma->base_odd);
 694        printk("vdma%d.prot_addr:     0x%08x\n", which,vdma->prot_addr);
 695        printk("vdma%d.base_page:     0x%08x\n", which,vdma->base_page);
 696        printk("vdma%d.pitch:         0x%08x\n", which,vdma->pitch);
 697        printk("vdma%d.num_line_byte: 0x%08x\n", which,vdma->num_line_byte);
 698*/
 699}
 700
 701static int calculate_video_dma_grab_packed(struct saa7146_dev* dev, struct saa7146_buf *buf)
 702{
 703        struct saa7146_vv *vv = dev->vv_data;
 704        struct saa7146_video_dma vdma1;
 705
 706        struct saa7146_format *sfmt = saa7146_format_by_fourcc(dev,buf->fmt->pixelformat);
 707
 708        int width = buf->fmt->width;
 709        int height = buf->fmt->height;
 710        int bytesperline = buf->fmt->bytesperline;
 711        enum v4l2_field field = buf->fmt->field;
 712
 713        int depth = sfmt->depth;
 714
 715        DEB_CAP("[size=%dx%d,fields=%s]\n",
 716                width, height, v4l2_field_names[field]);
 717
 718        if( bytesperline != 0) {
 719                vdma1.pitch = bytesperline*2;
 720        } else {
 721                vdma1.pitch = (width*depth*2)/8;
 722        }
 723        vdma1.num_line_byte     = ((vv->standard->v_field<<16) + vv->standard->h_pixels);
 724        vdma1.base_page         = buf->pt[0].dma | ME1 | sfmt->swap;
 725
 726        if( 0 != vv->vflip ) {
 727                vdma1.prot_addr = buf->pt[0].offset;
 728                vdma1.base_even = buf->pt[0].offset+(vdma1.pitch/2)*height;
 729                vdma1.base_odd  = vdma1.base_even - (vdma1.pitch/2);
 730        } else {
 731                vdma1.base_even = buf->pt[0].offset;
 732                vdma1.base_odd  = vdma1.base_even + (vdma1.pitch/2);
 733                vdma1.prot_addr = buf->pt[0].offset+(vdma1.pitch/2)*height;
 734        }
 735
 736        if (V4L2_FIELD_HAS_BOTH(field)) {
 737        } else if (field == V4L2_FIELD_ALTERNATE) {
 738                /* fixme */
 739                if ( vv->last_field == V4L2_FIELD_TOP ) {
 740                        vdma1.base_odd  = vdma1.prot_addr;
 741                        vdma1.pitch /= 2;
 742                } else if ( vv->last_field == V4L2_FIELD_BOTTOM ) {
 743                        vdma1.base_odd  = vdma1.base_even;
 744                        vdma1.base_even = vdma1.prot_addr;
 745                        vdma1.pitch /= 2;
 746                }
 747        } else if (field == V4L2_FIELD_TOP) {
 748                vdma1.base_odd  = vdma1.prot_addr;
 749                vdma1.pitch /= 2;
 750        } else if (field == V4L2_FIELD_BOTTOM) {
 751                vdma1.base_odd  = vdma1.base_even;
 752                vdma1.base_even = vdma1.prot_addr;
 753                vdma1.pitch /= 2;
 754        }
 755
 756        if( 0 != vv->vflip ) {
 757                vdma1.pitch *= -1;
 758        }
 759
 760        saa7146_write_out_dma(dev, 1, &vdma1);
 761        return 0;
 762}
 763
 764static int calc_planar_422(struct saa7146_vv *vv, struct saa7146_buf *buf, struct saa7146_video_dma *vdma2, struct saa7146_video_dma *vdma3)
 765{
 766        int height = buf->fmt->height;
 767        int width = buf->fmt->width;
 768
 769        vdma2->pitch    = width;
 770        vdma3->pitch    = width;
 771
 772        /* fixme: look at bytesperline! */
 773
 774        if( 0 != vv->vflip ) {
 775                vdma2->prot_addr        = buf->pt[1].offset;
 776                vdma2->base_even        = ((vdma2->pitch/2)*height)+buf->pt[1].offset;
 777                vdma2->base_odd         = vdma2->base_even - (vdma2->pitch/2);
 778
 779                vdma3->prot_addr        = buf->pt[2].offset;
 780                vdma3->base_even        = ((vdma3->pitch/2)*height)+buf->pt[2].offset;
 781                vdma3->base_odd         = vdma3->base_even - (vdma3->pitch/2);
 782        } else {
 783                vdma3->base_even        = buf->pt[2].offset;
 784                vdma3->base_odd         = vdma3->base_even + (vdma3->pitch/2);
 785                vdma3->prot_addr        = (vdma3->pitch/2)*height+buf->pt[2].offset;
 786
 787                vdma2->base_even        = buf->pt[1].offset;
 788                vdma2->base_odd         = vdma2->base_even + (vdma2->pitch/2);
 789                vdma2->prot_addr        = (vdma2->pitch/2)*height+buf->pt[1].offset;
 790        }
 791
 792        return 0;
 793}
 794
 795static int calc_planar_420(struct saa7146_vv *vv, struct saa7146_buf *buf, struct saa7146_video_dma *vdma2, struct saa7146_video_dma *vdma3)
 796{
 797        int height = buf->fmt->height;
 798        int width = buf->fmt->width;
 799
 800        vdma2->pitch    = width/2;
 801        vdma3->pitch    = width/2;
 802
 803        if( 0 != vv->vflip ) {
 804                vdma2->prot_addr        = buf->pt[2].offset;
 805                vdma2->base_even        = ((vdma2->pitch/2)*height)+buf->pt[2].offset;
 806                vdma2->base_odd         = vdma2->base_even - (vdma2->pitch/2);
 807
 808                vdma3->prot_addr        = buf->pt[1].offset;
 809                vdma3->base_even        = ((vdma3->pitch/2)*height)+buf->pt[1].offset;
 810                vdma3->base_odd         = vdma3->base_even - (vdma3->pitch/2);
 811
 812        } else {
 813                vdma3->base_even        = buf->pt[2].offset;
 814                vdma3->base_odd         = vdma3->base_even + (vdma3->pitch);
 815                vdma3->prot_addr        = (vdma3->pitch/2)*height+buf->pt[2].offset;
 816
 817                vdma2->base_even        = buf->pt[1].offset;
 818                vdma2->base_odd         = vdma2->base_even + (vdma2->pitch);
 819                vdma2->prot_addr        = (vdma2->pitch/2)*height+buf->pt[1].offset;
 820        }
 821        return 0;
 822}
 823
 824static int calculate_video_dma_grab_planar(struct saa7146_dev* dev, struct saa7146_buf *buf)
 825{
 826        struct saa7146_vv *vv = dev->vv_data;
 827        struct saa7146_video_dma vdma1;
 828        struct saa7146_video_dma vdma2;
 829        struct saa7146_video_dma vdma3;
 830
 831        struct saa7146_format *sfmt = saa7146_format_by_fourcc(dev,buf->fmt->pixelformat);
 832
 833        int width = buf->fmt->width;
 834        int height = buf->fmt->height;
 835        enum v4l2_field field = buf->fmt->field;
 836
 837        BUG_ON(0 == buf->pt[0].dma);
 838        BUG_ON(0 == buf->pt[1].dma);
 839        BUG_ON(0 == buf->pt[2].dma);
 840
 841        DEB_CAP("[size=%dx%d,fields=%s]\n",
 842                width, height, v4l2_field_names[field]);
 843
 844        /* fixme: look at bytesperline! */
 845
 846        /* fixme: what happens for user space buffers here?. The offsets are
 847           most likely wrong, this version here only works for page-aligned
 848           buffers, modifications to the pagetable-functions are necessary...*/
 849
 850        vdma1.pitch             = width*2;
 851        vdma1.num_line_byte     = ((vv->standard->v_field<<16) + vv->standard->h_pixels);
 852        vdma1.base_page         = buf->pt[0].dma | ME1;
 853
 854        if( 0 != vv->vflip ) {
 855                vdma1.prot_addr = buf->pt[0].offset;
 856                vdma1.base_even = ((vdma1.pitch/2)*height)+buf->pt[0].offset;
 857                vdma1.base_odd  = vdma1.base_even - (vdma1.pitch/2);
 858        } else {
 859                vdma1.base_even = buf->pt[0].offset;
 860                vdma1.base_odd  = vdma1.base_even + (vdma1.pitch/2);
 861                vdma1.prot_addr = (vdma1.pitch/2)*height+buf->pt[0].offset;
 862        }
 863
 864        vdma2.num_line_byte     = 0; /* unused */
 865        vdma2.base_page         = buf->pt[1].dma | ME1;
 866
 867        vdma3.num_line_byte     = 0; /* unused */
 868        vdma3.base_page         = buf->pt[2].dma | ME1;
 869
 870        switch( sfmt->depth ) {
 871                case 12: {
 872                        calc_planar_420(vv,buf,&vdma2,&vdma3);
 873                        break;
 874                }
 875                case 16: {
 876                        calc_planar_422(vv,buf,&vdma2,&vdma3);
 877                        break;
 878                }
 879                default: {
 880                        return -1;
 881                }
 882        }
 883
 884        if (V4L2_FIELD_HAS_BOTH(field)) {
 885        } else if (field == V4L2_FIELD_ALTERNATE) {
 886                /* fixme */
 887                vdma1.base_odd  = vdma1.prot_addr;
 888                vdma1.pitch /= 2;
 889                vdma2.base_odd  = vdma2.prot_addr;
 890                vdma2.pitch /= 2;
 891                vdma3.base_odd  = vdma3.prot_addr;
 892                vdma3.pitch /= 2;
 893        } else if (field == V4L2_FIELD_TOP) {
 894                vdma1.base_odd  = vdma1.prot_addr;
 895                vdma1.pitch /= 2;
 896                vdma2.base_odd  = vdma2.prot_addr;
 897                vdma2.pitch /= 2;
 898                vdma3.base_odd  = vdma3.prot_addr;
 899                vdma3.pitch /= 2;
 900        } else if (field == V4L2_FIELD_BOTTOM) {
 901                vdma1.base_odd  = vdma1.base_even;
 902                vdma1.base_even = vdma1.prot_addr;
 903                vdma1.pitch /= 2;
 904                vdma2.base_odd  = vdma2.base_even;
 905                vdma2.base_even = vdma2.prot_addr;
 906                vdma2.pitch /= 2;
 907                vdma3.base_odd  = vdma3.base_even;
 908                vdma3.base_even = vdma3.prot_addr;
 909                vdma3.pitch /= 2;
 910        }
 911
 912        if( 0 != vv->vflip ) {
 913                vdma1.pitch *= -1;
 914                vdma2.pitch *= -1;
 915                vdma3.pitch *= -1;
 916        }
 917
 918        saa7146_write_out_dma(dev, 1, &vdma1);
 919        if( (sfmt->flags & FORMAT_BYTE_SWAP) != 0 ) {
 920                saa7146_write_out_dma(dev, 3, &vdma2);
 921                saa7146_write_out_dma(dev, 2, &vdma3);
 922        } else {
 923                saa7146_write_out_dma(dev, 2, &vdma2);
 924                saa7146_write_out_dma(dev, 3, &vdma3);
 925        }
 926        return 0;
 927}
 928
 929static void program_capture_engine(struct saa7146_dev *dev, int planar)
 930{
 931        struct saa7146_vv *vv = dev->vv_data;
 932        int count = 0;
 933
 934        unsigned long e_wait = vv->current_hps_sync == SAA7146_HPS_SYNC_PORT_A ? CMD_E_FID_A : CMD_E_FID_B;
 935        unsigned long o_wait = vv->current_hps_sync == SAA7146_HPS_SYNC_PORT_A ? CMD_O_FID_A : CMD_O_FID_B;
 936
 937        /* wait for o_fid_a/b / e_fid_a/b toggle only if rps register 0 is not set*/
 938        WRITE_RPS0(CMD_PAUSE | CMD_OAN | CMD_SIG0 | o_wait);
 939        WRITE_RPS0(CMD_PAUSE | CMD_OAN | CMD_SIG0 | e_wait);
 940
 941        /* set rps register 0 */
 942        WRITE_RPS0(CMD_WR_REG | (1 << 8) | (MC2/4));
 943        WRITE_RPS0(MASK_27 | MASK_11);
 944
 945        /* turn on video-dma1 */
 946        WRITE_RPS0(CMD_WR_REG_MASK | (MC1/4));
 947        WRITE_RPS0(MASK_06 | MASK_22);                  /* => mask */
 948        WRITE_RPS0(MASK_06 | MASK_22);                  /* => values */
 949        if( 0 != planar ) {
 950                /* turn on video-dma2 */
 951                WRITE_RPS0(CMD_WR_REG_MASK | (MC1/4));
 952                WRITE_RPS0(MASK_05 | MASK_21);                  /* => mask */
 953                WRITE_RPS0(MASK_05 | MASK_21);                  /* => values */
 954
 955                /* turn on video-dma3 */
 956                WRITE_RPS0(CMD_WR_REG_MASK | (MC1/4));
 957                WRITE_RPS0(MASK_04 | MASK_20);                  /* => mask */
 958                WRITE_RPS0(MASK_04 | MASK_20);                  /* => values */
 959        }
 960
 961        /* wait for o_fid_a/b / e_fid_a/b toggle */
 962        if ( vv->last_field == V4L2_FIELD_INTERLACED ) {
 963                WRITE_RPS0(CMD_PAUSE | o_wait);
 964                WRITE_RPS0(CMD_PAUSE | e_wait);
 965        } else if ( vv->last_field == V4L2_FIELD_TOP ) {
 966                WRITE_RPS0(CMD_PAUSE | (vv->current_hps_sync == SAA7146_HPS_SYNC_PORT_A ? MASK_10 : MASK_09));
 967                WRITE_RPS0(CMD_PAUSE | o_wait);
 968        } else if ( vv->last_field == V4L2_FIELD_BOTTOM ) {
 969                WRITE_RPS0(CMD_PAUSE | (vv->current_hps_sync == SAA7146_HPS_SYNC_PORT_A ? MASK_10 : MASK_09));
 970                WRITE_RPS0(CMD_PAUSE | e_wait);
 971        }
 972
 973        /* turn off video-dma1 */
 974        WRITE_RPS0(CMD_WR_REG_MASK | (MC1/4));
 975        WRITE_RPS0(MASK_22 | MASK_06);                  /* => mask */
 976        WRITE_RPS0(MASK_22);                            /* => values */
 977        if( 0 != planar ) {
 978                /* turn off video-dma2 */
 979                WRITE_RPS0(CMD_WR_REG_MASK | (MC1/4));
 980                WRITE_RPS0(MASK_05 | MASK_21);                  /* => mask */
 981                WRITE_RPS0(MASK_21);                            /* => values */
 982
 983                /* turn off video-dma3 */
 984                WRITE_RPS0(CMD_WR_REG_MASK | (MC1/4));
 985                WRITE_RPS0(MASK_04 | MASK_20);                  /* => mask */
 986                WRITE_RPS0(MASK_20);                            /* => values */
 987        }
 988
 989        /* generate interrupt */
 990        WRITE_RPS0(CMD_INTERRUPT);
 991
 992        /* stop */
 993        WRITE_RPS0(CMD_STOP);
 994}
 995
 996void saa7146_set_capture(struct saa7146_dev *dev, struct saa7146_buf *buf, struct saa7146_buf *next)
 997{
 998        struct saa7146_format *sfmt = saa7146_format_by_fourcc(dev,buf->fmt->pixelformat);
 999        struct saa7146_vv *vv = dev->vv_data;
1000        u32 vdma1_prot_addr;
1001
1002        DEB_CAP("buf:%p, next:%p\n", buf, next);
1003
1004        vdma1_prot_addr = saa7146_read(dev, PROT_ADDR1);
1005        if( 0 == vdma1_prot_addr ) {
1006                /* clear out beginning of streaming bit (rps register 0)*/
1007                DEB_CAP("forcing sync to new frame\n");
1008                saa7146_write(dev, MC2, MASK_27 );
1009        }
1010
1011        saa7146_set_window(dev, buf->fmt->width, buf->fmt->height, buf->fmt->field);
1012        saa7146_set_output_format(dev, sfmt->trans);
1013        saa7146_disable_clipping(dev);
1014
1015        if ( vv->last_field == V4L2_FIELD_INTERLACED ) {
1016        } else if ( vv->last_field == V4L2_FIELD_TOP ) {
1017                vv->last_field = V4L2_FIELD_BOTTOM;
1018        } else if ( vv->last_field == V4L2_FIELD_BOTTOM ) {
1019                vv->last_field = V4L2_FIELD_TOP;
1020        }
1021
1022        if( 0 != IS_PLANAR(sfmt->trans)) {
1023                calculate_video_dma_grab_planar(dev, buf);
1024                program_capture_engine(dev,1);
1025        } else {
1026                calculate_video_dma_grab_packed(dev, buf);
1027                program_capture_engine(dev,0);
1028        }
1029
1030/*
1031        printk("vdma%d.base_even:     0x%08x\n", 1,saa7146_read(dev,BASE_EVEN1));
1032        printk("vdma%d.base_odd:      0x%08x\n", 1,saa7146_read(dev,BASE_ODD1));
1033        printk("vdma%d.prot_addr:     0x%08x\n", 1,saa7146_read(dev,PROT_ADDR1));
1034        printk("vdma%d.base_page:     0x%08x\n", 1,saa7146_read(dev,BASE_PAGE1));
1035        printk("vdma%d.pitch:         0x%08x\n", 1,saa7146_read(dev,PITCH1));
1036        printk("vdma%d.num_line_byte: 0x%08x\n", 1,saa7146_read(dev,NUM_LINE_BYTE1));
1037        printk("vdma%d => vptr      : 0x%08x\n", 1,saa7146_read(dev,PCI_VDP1));
1038*/
1039
1040        /* write the address of the rps-program */
1041        saa7146_write(dev, RPS_ADDR0, dev->d_rps0.dma_handle);
1042
1043        /* turn on rps */
1044        saa7146_write(dev, MC1, (MASK_12 | MASK_28));
1045}
1046