1 /*****************************************************************************
2 * i420_ymga.c : YUV to YUV conversion module for vlc
3 *****************************************************************************
4 * Copyright (C) 2000, 2001 the VideoLAN team
7 * Authors: Samuel Hocevar <sam@zoy.org>
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
19 * You should have received a copy of the GNU General Public License
20 * along with this program; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
22 *****************************************************************************/
24 /*****************************************************************************
26 *****************************************************************************/
27 #include <errno.h> /* ENOMEM */
33 #include <vlc_common.h>
34 #include <vlc_plugin.h>
35 #include <vlc_filter.h>
38 #define SRC_FOURCC "I420,IYUV,YV12"
39 #define DEST_FOURCC "YMGA"
41 /*****************************************************************************
42 * Local and extern prototypes.
43 *****************************************************************************/
44 static int Activate ( vlc_object_t * );
45 static void I420_YMGA ( filter_t *, picture_t *, picture_t * );
47 /*****************************************************************************
49 *****************************************************************************/
/* Module descriptor entries. The description string and the score passed to
 * set_capability() depend on which variant of the module is being compiled.
 * NOTE(review): the enclosing begin/end macros and the closing #endif are not
 * visible in this excerpt. */
51 #if defined (MODULE_NAME_IS_i420_ymga)
/* Plain variant: "chroma" capability registered with value 80. */
52 set_description( N_("Conversions from " SRC_FOURCC " to " DEST_FOURCC) );
53 set_capability( "chroma", 80 );
54 #elif defined (MODULE_NAME_IS_i420_ymga_mmx)
/* MMX variant: "chroma" capability registered with value 100 (presumably so
 * it is preferred over the plain variant - confirm against the module
 * loader), plus an explicit MMX requirement. */
55 set_description( N_("MMX conversions from " SRC_FOURCC " to " DEST_FOURCC) );
56 set_capability( "chroma", 100 );
57 add_requirement( MMX );
/* Activate is registered as the first callback; the second one is NULL. */
59 set_callbacks( Activate, NULL );
62 /*****************************************************************************
63 * Activate: select the chroma conversion function
64 *****************************************************************************
65 * Checks the input/output chromas and installs the conversion routine
66 *****************************************************************************/
/* Activate: callback registered through set_callbacks() in the module
 * descriptor. When the input chroma is YV12, I420 or IYUV and the output
 * chroma is YMGA, it installs I420_YMGA as the filter's conversion routine.
 * NOTE(review): the rejection branches and return statements are not visible
 * in this excerpt; return values must be checked against the full file. */
67 static int Activate( vlc_object_t *p_this )
/* The object handed to the callback is used as a filter_t. */
69 filter_t *p_filter = (filter_t *)p_this;
/* True when the input width or height is odd (low bit set).
 * NOTE(review): presumably such sizes are refused - the branch body is not
 * shown here. */
71 if( p_filter->fmt_in.video.i_width & 1
72 || p_filter->fmt_in.video.i_height & 1 )
/* Dispatch on the input chroma first: all three planar 4:2:0 FOURCCs share
 * the same handling below. */
77 switch( p_filter->fmt_in.video.i_chroma )
79 case VLC_FOURCC('Y','V','1','2'):
80 case VLC_FOURCC('I','4','2','0'):
81 case VLC_FOURCC('I','Y','U','V'):
/* ...then on the requested output chroma. */
82 switch( p_filter->fmt_out.video.i_chroma )
84 case VLC_FOURCC('Y','M','G','A'):
/* Only supported pair in view: install the conversion routine. */
85 p_filter->pf_video_filter_io = I420_YMGA;
100 /* Following functions are local */
102 /*****************************************************************************
103 * I420_YMGA: planar YUV 4:2:0 to Matrox's planar/packed YUV 4:2:0
104 *****************************************************************************/
105 static void I420_YMGA( filter_t *p_filter, picture_t *p_source,
108 uint8_t *p_uv = p_dest->U_PIXELS;
109 uint8_t *p_u = p_source->U_PIXELS;
110 uint8_t *p_v = p_source->V_PIXELS;
114 /* Copy the Y part */
115 vlc_memcpy( p_dest->Y_PIXELS, p_source->Y_PIXELS,
116 p_dest->p[Y_PLANE].i_pitch * p_dest->p[Y_PLANE].i_visible_lines );
118 /* Copy the U:V part */
119 for( i_x = p_dest->p[U_PLANE].i_pitch * p_dest->p[U_PLANE].i_visible_lines / 64;
122 #if defined (MODULE_NAME_IS_i420_ymga)
123 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
124 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
125 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
126 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
127 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
128 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
129 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
130 *p_uv++ = *p_u++; *p_uv++ = *p_v++; *p_uv++ = *p_u++; *p_uv++ = *p_v++;
132 __asm__( ".p2align 5 \n\
133 movd (%0), %%mm0 # Load 4 Cr 00 00 00 00 v3 v2 v1 v0 \n\
134 movd 4(%0), %%mm2 # Load 4 Cr 00 00 00 00 v3 v2 v1 v0 \n\
135 movd 8(%0), %%mm4 # Load 4 Cr 00 00 00 00 v3 v2 v1 v0 \n\
136 movd 12(%0), %%mm6 # Load 4 Cr 00 00 00 00 v3 v2 v1 v0 \n\
137 movd (%1), %%mm1 # Load 4 Cb 00 00 00 00 u3 u2 u1 u0 \n\
138 movd 4(%1), %%mm3 # Load 4 Cb 00 00 00 00 u3 u2 u1 u0 \n\
139 movd 8(%1), %%mm5 # Load 4 Cb 00 00 00 00 u3 u2 u1 u0 \n\
140 movd 12(%1), %%mm7 # Load 4 Cb 00 00 00 00 u3 u2 u1 u0 \n\
141 punpcklbw %%mm1, %%mm0 # u3 v3 u2 v2 u1 v1 u0 v0 \n\
142 punpcklbw %%mm3, %%mm2 # u3 v3 u2 v2 u1 v1 u0 v0 \n\
143 punpcklbw %%mm5, %%mm4 # u3 v3 u2 v2 u1 v1 u0 v0 \n\
144 punpcklbw %%mm7, %%mm6 # u3 v3 u2 v2 u1 v1 u0 v0 \n\
145 movq %%mm0, (%2) # Store CrCb \n\
146 movq %%mm2, 8(%2) # Store CrCb \n\
147 movq %%mm4, 16(%2) # Store CrCb \n\
148 movq %%mm6, 24(%2) # Store CrCb"
149 : : "r" (p_v), "r" (p_u), "r" (p_uv) );
151 p_v += 16; p_u += 16; p_uv += 32;