diff -urN MPlayer-1.0pre5.old/libvo/vo_x11.c MPlayer-1.0pre5/libvo/vo_x11.c --- MPlayer-1.0pre5.old/libvo/vo_x11.c 2004-10-15 21:54:24.809523440 -0700 +++ MPlayer-1.0pre5/libvo/vo_x11.c 2004-10-15 21:52:40.178429784 -0700 @@ -39,7 +39,6 @@ #include "sub.h" #include "../postproc/swscale.h" -#include "../postproc/swscale_internal.h" //FIXME #include "../postproc/rgb2rgb.h" #include "../libmpcodecs/vf_scale.h" @@ -49,6 +48,7 @@ #include "../Gui/interface.h" #include "../mplayer.h" #endif +#include "../postproc/swscale_internal.h" //FIXME static vo_info_t info = { "X11 ( XImage/Shm )", diff -urN MPlayer-1.0pre5.old/postproc/swscale.c MPlayer-1.0pre5/postproc/swscale.c --- MPlayer-1.0pre5.old/postproc/swscale.c 2004-10-15 21:54:24.812522984 -0700 +++ MPlayer-1.0pre5/postproc/swscale.c 2004-10-15 21:52:40.181429328 -0700 @@ -1728,7 +1728,7 @@ //FIXME factorize #ifdef HAVE_ALTIVEC - yuv2rgb_altivec_init_tables (c, inv_table); + yuv2rgb_altivec_init_tables (c, inv_table, brightness, contrast, saturation); #endif return 0; } diff -urN MPlayer-1.0pre5.old/postproc/swscale_internal.h MPlayer-1.0pre5/postproc/swscale_internal.h --- MPlayer-1.0pre5.old/postproc/swscale_internal.h 2004-10-15 21:54:24.813522832 -0700 +++ MPlayer-1.0pre5/postproc/swscale_internal.h 2004-10-15 21:55:47.226994080 -0700 @@ -19,6 +19,16 @@ #ifndef SWSCALE_INTERNAL_H #define SWSCALE_INTERNAL_H +#ifdef CONFIG_DARWIN +#define AVV(x...) (x) +#else +#define AVV(x...) {x} +#endif + +#ifdef HAVE_ALTIVEC +#include +#endif + #include "../mp_msg.h" #define MSG_WARN(args...) mp_msg(MSGT_SWS,MSGL_WARN, ##args ) diff -urN MPlayer-1.0pre5.old/postproc/yuv2rgb_altivec.c MPlayer-1.0pre5/postproc/yuv2rgb_altivec.c --- MPlayer-1.0pre5.old/postproc/yuv2rgb_altivec.c 2004-10-15 21:54:24.818522072 -0700 +++ MPlayer-1.0pre5/postproc/yuv2rgb_altivec.c 2004-10-15 21:52:40.185428720 -0700 @@ -64,6 +64,7 @@ */ #include #include +#include #include #include #include "config.h" @@ -118,13 +119,13 @@ */ static const vector unsigned char - perm_rgb_0 = (vector unsigned char)(0x00,0x01,0x10,0x02,0x03,0x11,0x04,0x05, + perm_rgb_0 = (const vector unsigned char)AVV(0x00,0x01,0x10,0x02,0x03,0x11,0x04,0x05, 0x12,0x06,0x07,0x13,0x08,0x09,0x14,0x0a), - perm_rgb_1 = (vector unsigned char)(0x0b,0x15,0x0c,0x0d,0x16,0x0e,0x0f,0x17, + perm_rgb_1 = (const vector unsigned char)AVV(0x0b,0x15,0x0c,0x0d,0x16,0x0e,0x0f,0x17, 0x18,0x19,0x1a,0x1b,0x1c,0x1d,0x1e,0x1f), - perm_rgb_2 = (vector unsigned char)(0x10,0x11,0x12,0x13,0x14,0x15,0x16,0x17, + perm_rgb_2 = (const vector unsigned char)AVV(0x10,0x11,0x12,0x13,0x14,0x15,0x16,0x17, 0x00,0x01,0x18,0x02,0x03,0x19,0x04,0x05), - perm_rgb_3 = (vector unsigned char)(0x1a,0x06,0x07,0x1b,0x08,0x09,0x1c,0x0a, + perm_rgb_3 = (const vector unsigned char)AVV(0x1a,0x06,0x07,0x1b,0x08,0x09,0x1c,0x0a, 0x0b,0x1d,0x0c,0x0d,0x1e,0x0e,0x0f,0x1f); #define vec_merge3(x2,x1,x0,y0,y1,y2) \ @@ -197,39 +198,40 @@ #define vec_unh(x) \ (vector signed short) \ - vec_perm(x,(typeof(x))(0),\ - (vector unsigned char)(0x10,0x00,0x10,0x01,0x10,0x02,0x10,0x03,\ + vec_perm(x,(typeof(x))AVV(0),\ + (vector unsigned char)AVV(0x10,0x00,0x10,0x01,0x10,0x02,0x10,0x03,\ 0x10,0x04,0x10,0x05,0x10,0x06,0x10,0x07)) #define vec_unl(x) \ (vector signed short) \ - vec_perm(x,(typeof(x))(0),\ - (vector unsigned char)(0x10,0x08,0x10,0x09,0x10,0x0A,0x10,0x0B,\ + vec_perm(x,(typeof(x))AVV(0),\ + (vector unsigned char)AVV(0x10,0x08,0x10,0x09,0x10,0x0A,0x10,0x0B,\ 0x10,0x0C,0x10,0x0D,0x10,0x0E,0x10,0x0F)) #define vec_clip(x) \ - vec_max (vec_min (x, (typeof(x))(255)), (typeof(x))(0)) + vec_max (vec_min (x, (typeof(x))AVV(235)), (typeof(x))AVV(16)) #define vec_packclp_a(x,y) \ (vector unsigned char)vec_pack (vec_clip (x), vec_clip (y)) #define vec_packclp(x,y) \ (vector unsigned char)vec_packs \ - ((vector unsigned short)vec_max (x,(vector signed short) (0)), \ - (vector unsigned short)vec_max (y,(vector signed short) (0))) + ((vector unsigned short)vec_max (x,(vector signed short) AVV(0)), \ + (vector unsigned short)vec_max (y,(vector signed short) AVV(0))) -//#define out_pixels(a,b,c,ptr) vec_mstrgb32(typeof(a),((typeof (a))(0)),a,a,a,ptr) +//#define out_pixels(a,b,c,ptr) vec_mstrgb32(typeof(a),((typeof (a))AVV(0)),a,a,a,ptr) -static inline cvtyuvtoRGB (SwsContext *c, +static inline void cvtyuvtoRGB (SwsContext *c, vector signed short Y, vector signed short U, vector signed short V, vector signed short *R, vector signed short *G, vector signed short *B) { vector signed short vx,ux,uvx; Y = vec_mradds (Y, c->CY, c->OY); - - U = vec_sub (U,(vector signed short)(128)); - V = vec_sub (V,(vector signed short)(128)); + U = vec_sub (U,(vector signed short) + vec_splat((vector signed short)AVV(128),0)); + V = vec_sub (V,(vector signed short) + vec_splat((vector signed short)AVV(128),0)); // ux = (CBU*(u<CSHIFT)+0x4000)>>15; ux = vec_sl (U, c->CSHIFT); @@ -323,8 +325,13 @@ align_perm = vec_lvsl (0, vi); \ v = (vector signed char)vec_perm (vivP[0], vivP[1], align_perm); \ \ - u = (vector signed char)vec_sub (u, (vector signed char)(128)); \ - v = (vector signed char)vec_sub (v, (vector signed char)(128)); \ + u = (vector signed char) \ + vec_sub (u,(vector signed char) \ + vec_splat((vector signed char)AVV(128),0));\ + v = (vector signed char) \ + vec_sub (v,(vector signed char) \ + vec_splat((vector signed char)AVV(128),0));\ + \ U = vec_unpackh (u); \ V = vec_unpackh (v); \ \ @@ -341,18 +348,18 @@ \ /* ux = (CBU*(u<>15 */ \ ux = vec_sl (U, lCSHIFT); \ - ux = vec_mradds (ux, lCBU, (vector signed short)(0)); \ + ux = vec_mradds (ux, lCBU, (vector signed short)AVV(0)); \ ux0 = vec_mergeh (ux,ux); \ ux1 = vec_mergel (ux,ux); \ \ /* vx = (CRV*(v<>15; */ \ vx = vec_sl (V, lCSHIFT); \ - vx = vec_mradds (vx, lCRV, (vector signed short)(0)); \ + vx = vec_mradds (vx, lCRV, (vector signed short)AVV(0)); \ vx0 = vec_mergeh (vx,vx); \ vx1 = vec_mergel (vx,vx); \ \ /* uvx = ((CGU*u) + (CGV*v))>>15 */ \ - uvx = vec_mradds (U, lCGU, (vector signed short)(0)); \ + uvx = vec_mradds (U, lCGU, (vector signed short)AVV(0)); \ uvx = vec_mradds (V, lCGV, uvx); \ uvx0 = vec_mergeh (uvx,uvx); \ uvx1 = vec_mergel (uvx,uvx); \ @@ -402,15 +409,167 @@ } -#define out_abgr(a,b,c,ptr) vec_mstrgb32(typeof(a),((typeof (a))(0)),c,b,a,ptr) -#define out_bgra(a,b,c,ptr) vec_mstrgb32(typeof(a),c,b,a,((typeof (a))(0)),ptr) -#define out_rgba(a,b,c,ptr) vec_mstrgb32(typeof(a),a,b,c,((typeof (a))(0)),ptr) -#define out_argb(a,b,c,ptr) vec_mstrgb32(typeof(a),((typeof (a))(0)),a,b,c,ptr) +#define out_abgr(a,b,c,ptr) vec_mstrgb32(typeof(a),((typeof (a))AVV(0)),c,b,a,ptr) +#define out_bgra(a,b,c,ptr) vec_mstrgb32(typeof(a),c,b,a,((typeof (a))AVV(0)),ptr) +#define out_rgba(a,b,c,ptr) vec_mstrgb32(typeof(a),a,b,c,((typeof (a))AVV(0)),ptr) +#define out_argb(a,b,c,ptr) vec_mstrgb32(typeof(a),((typeof (a))AVV(0)),a,b,c,ptr) #define out_rgb24(a,b,c,ptr) vec_mstrgb24(a,b,c,ptr) -#define out_bgr24(a,b,c,ptr) vec_mstrgb24(c,b,a,ptr) +#define out_bgr24(a,b,c,ptr) vec_mstbgr24(c,b,a,ptr) DEFCSP420_CVT (yuv2_abgr32, out_abgr) +#if 1 DEFCSP420_CVT (yuv2_bgra32, out_argb) +#else +static int altivec_yuv2_bgra32 (SwsContext *c, + unsigned char **in, int *instrides, + int srcSliceY, int srcSliceH, + unsigned char **oplanes, int *outstrides) +{ + int w = c->srcW; + int h = srcSliceH; + int i,j; + int instrides_scl[3]; + vector unsigned char y0,y1; + + vector signed char u,v; + + vector signed short Y0,Y1,Y2,Y3; + vector signed short U,V; + vector signed short vx,ux,uvx; + vector signed short vx0,ux0,uvx0; + vector signed short vx1,ux1,uvx1; + vector signed short R0,G0,B0; + vector signed short R1,G1,B1; + vector unsigned char R,G,B; + + vector unsigned char *uivP, *vivP; + vector unsigned char align_perm; + + vector signed short + lCY = c->CY, + lOY = c->OY, + lCRV = c->CRV, + lCBU = c->CBU, + lCGU = c->CGU, + lCGV = c->CGV; + + vector unsigned short lCSHIFT = c->CSHIFT; + + ubyte *y1i = in[0]; + ubyte *y2i = in[0]+w; + ubyte *ui = in[1]; + ubyte *vi = in[2]; + + vector unsigned char *oute + = (vector unsigned char *) + (oplanes[0]+srcSliceY*outstrides[0]); + vector unsigned char *outo + = (vector unsigned char *) + (oplanes[0]+srcSliceY*outstrides[0]+outstrides[0]); + + + instrides_scl[0] = instrides[0]; + instrides_scl[1] = instrides[1]-w/2; /* the loop moves ui by w/2 */ + instrides_scl[2] = instrides[2]-w/2; /* the loop moves vi by w/2 */ + + + for (i=0;i>15 */ + ux = vec_sl (U, lCSHIFT); + ux = vec_mradds (ux, lCBU, (vector signed short)AVV(0)); + ux0 = vec_mergeh (ux,ux); + ux1 = vec_mergel (ux,ux); + + /* vx = (CRV*(v<>15; */ + vx = vec_sl (V, lCSHIFT); + vx = vec_mradds (vx, lCRV, (vector signed short)AVV(0)); + vx0 = vec_mergeh (vx,vx); + vx1 = vec_mergel (vx,vx); + /* uvx = ((CGU*u) + (CGV*v))>>15 */ + uvx = vec_mradds (U, lCGU, (vector signed short)AVV(0)); + uvx = vec_mradds (V, lCGV, uvx); + uvx0 = vec_mergeh (uvx,uvx); + uvx1 = vec_mergel (uvx,uvx); + R0 = vec_add (Y0,vx0); + G0 = vec_add (Y0,uvx0); + B0 = vec_add (Y0,ux0); + R1 = vec_add (Y1,vx1); + G1 = vec_add (Y1,uvx1); + B1 = vec_add (Y1,ux1); + R = vec_packclp (R0,R1); + G = vec_packclp (G0,G1); + B = vec_packclp (B0,B1); + + out_argb(R,G,B,oute); + R0 = vec_add (Y2,vx0); + G0 = vec_add (Y2,uvx0); + B0 = vec_add (Y2,ux0); + R1 = vec_add (Y3,vx1); + G1 = vec_add (Y3,uvx1); + B1 = vec_add (Y3,ux1); + R = vec_packclp (R0,R1); + G = vec_packclp (G0,G1); + B = vec_packclp (B0,B1); + + out_argb(R,G,B,outo); + y1i += 16; + y2i += 16; + ui += 8; + vi += 8; + + } + + outo += (outstrides[0])>>4; + oute += (outstrides[0])>>4; + + ui += instrides_scl[1]; + vi += instrides_scl[2]; + y1i += instrides_scl[0]; + y2i += instrides_scl[0]; + } + return srcSliceH; +} + +#endif + + DEFCSP420_CVT (yuv2_rgba32, out_rgba) DEFCSP420_CVT (yuv2_argb32, out_argb) DEFCSP420_CVT (yuv2_rgb24, out_rgb24) @@ -421,15 +580,15 @@ // 0123 4567 89ab cdef static const vector unsigned char - demux_u = (vector unsigned char)(0x10,0x00,0x10,0x00, + demux_u = (const vector unsigned char)AVV(0x10,0x00,0x10,0x00, 0x10,0x04,0x10,0x04, 0x10,0x08,0x10,0x08, 0x10,0x0c,0x10,0x0c), - demux_v = (vector unsigned char)(0x10,0x02,0x10,0x02, + demux_v = (const vector unsigned char)AVV(0x10,0x02,0x10,0x02, 0x10,0x06,0x10,0x06, 0x10,0x0A,0x10,0x0A, 0x10,0x0E,0x10,0x0E), - demux_y = (vector unsigned char)(0x10,0x01,0x10,0x03, + demux_y = (const vector unsigned char)AVV(0x10,0x01,0x10,0x03, 0x10,0x05,0x10,0x07, 0x10,0x09,0x10,0x0B, 0x10,0x0D,0x10,0x0F); @@ -460,25 +619,25 @@ for (j=0;j RGB32\n"); return altivec_uyvy_rgb32; - case IMGFMT_RGB24: - case IMGFMT_BGR32: - default: return NULL; } break; @@ -565,102 +722,38 @@ return NULL; } - -int yuv2rgb_altivec_init_tables (SwsContext *c, const int inv_table[4]) +void yuv2rgb_altivec_init_tables (SwsContext *c, const int inv_table[4],int brightness,int contrast, int saturation) { - - vector signed short - CY = (vector signed short)(0x7fff), - CRV = (vector signed short)(22972), - CBU = (vector signed short)(29029), - CGU = (vector signed short)(-11276), - CGV = (vector signed short)(-23400), - OY; - - vector unsigned short CSHIFT = (vector unsigned short)(1); - - vector signed short Y0; - int brightness = c->brightness, contrast = c->contrast, saturation = c->saturation; - int64_t crv __attribute__ ((aligned(16))); - int64_t cbu __attribute__ ((aligned(16))); - int64_t cgu __attribute__ ((aligned(16))); - int64_t cgv __attribute__ ((aligned(16))); - short tmp __attribute__ ((aligned(16))); - - int64_t cy = (1<<16)-1; - int64_t oy = 0; - - if ((c->flags & SWS_CPU_CAPS_ALTIVEC) == 0) - return; - - crv = inv_table[0]; - cbu = inv_table[1]; - cgu = inv_table[2]; - cgv = inv_table[3]; - + union { + signed short tmp[8] __attribute__ ((aligned(16))); + vector signed short vec; + } buf; + + buf.tmp[0] = ( (0xffffLL) * contrast>>8 )>>9; //cy + buf.tmp[1] = -256*brightness; //oy + buf.tmp[2] = (inv_table[0]>>3) *(contrast>>16)*(saturation>>16); //crv + buf.tmp[3] = (inv_table[1]>>3) *(contrast>>16)*(saturation>>16); //cbu + buf.tmp[4] = -((inv_table[2]>>1)*(contrast>>16)*(saturation>>16)); //cgu + buf.tmp[5] = -((inv_table[3]>>1)*(contrast>>16)*(saturation>>16)); //cgv + + + c->CSHIFT = (vector unsigned short)vec_splat((vector unsigned short)AVV(2),0); + c->CY = vec_splat ((vector signed short)buf.vec, 0); + c->OY = vec_splat ((vector signed short)buf.vec, 1); + c->CRV = vec_splat ((vector signed short)buf.vec, 2); + c->CBU = vec_splat ((vector signed short)buf.vec, 3); + c->CGU = vec_splat ((vector signed short)buf.vec, 4); + c->CGV = vec_splat ((vector signed short)buf.vec, 5); #if 0 - printf ("crv: %hvx\n", CRV); - printf ("cbu: %hvx\n", CBU); - printf ("cgv: %hvx\n", CGV); - printf ("cgu: %hvx\n", CGU); - - printf ("contrast: %d, brightness: %d, saturation: %d\n", contrast, brightness, saturation); - - printf("%lld %lld %lld %lld %lld\n", cy, crv, cbu, cgu, cgv); -#endif - - cy = (cy *contrast )>>17; - crv= (crv*contrast * saturation)>>32; - cbu= (cbu*contrast * saturation)>>32; - cgu= (cgu*contrast * saturation)>>32; - cgv= (cgv*contrast * saturation)>>32; - - oy -= 256*brightness; - - - //printf("%llx %llx %llx %llx %llx\n", cy, crv, cbu, cgu, cgv); - - // vector signed short CBU,CRV,CGU,CGY,CY; - tmp = cy; - CY = vec_lde (0, &tmp); - CY = vec_splat (CY, 0); - - tmp = oy; - OY = vec_lde (0, &tmp); - OY = vec_splat (OY, 0); - - tmp = crv>>3; - CRV = vec_lde (0, &tmp); - CRV = vec_splat (CRV, 0); - tmp = cbu>>3; - CBU = vec_lde (0, &tmp); - CBU = vec_splat (CBU, 0); - - tmp = -(cgu>>1); - CGU = vec_lde (0, &tmp); - CGU = vec_splat (CGU, 0); - tmp = -(cgv>>1); - CGV = vec_lde (0, &tmp); - CGV = vec_splat (CGV, 0); - - CSHIFT = (vector unsigned short)(2); -#if 1 - c->CSHIFT = CSHIFT; - c->CY = CY; - c->OY = OY; - c->CRV = CRV; - c->CBU = CBU; - c->CGU = CGU; - c->CGV = CGV; -#endif -#if 1 - printf ("cy: %hvx\n", CY); - printf ("oy: %hvx\n", OY); - printf ("crv: %hvx\n", CRV); - printf ("cbu: %hvx\n", CBU); - printf ("cgv: %hvx\n", CGV); - printf ("cgu: %hvx\n", CGU); +{ +int i; +char *v[6]={"cy","oy","crv","cbu","cgu","cgv"}; +for (i=0; i<6;i++) + printf("%s %d ", v[i],buf.tmp[i] ); + printf("\n"); +} #endif + return; } @@ -672,15 +765,16 @@ { int i,j; short tmp __attribute__((aligned (16))); - short *p; + int16_t *p; short *f; vector signed short X,X0,X1,Y0,U0,V0,Y1,U1,V1,U,V; vector signed short R0,G0,B0,R1,G1,B1; vector unsigned char R,G,B,pels[3]; vector unsigned char *out,*nout; - vector signed short RND = (vector signed short)(1<<3); - vector unsigned short SCL = (vector unsigned short)(4); + + vector signed short RND = vec_splat((vector signed short)AVV(1<<3),0); + vector unsigned short SCL = vec_splat((vector unsigned short)AVV(4),0); unsigned long scratch[16] __attribute__ ((aligned (16))); vector signed short *vYCoeffsBank, *vCCoeffsBank; @@ -832,5 +926,3 @@ if (vCCoeffsBank) free (vCCoeffsBank); } - -