Plan 9 from Bell Labs’s /usr/web/sources/contrib/de0u/root/sys/src/cmd/squeak/Cross/plugins/Mpeg3Plugin/libmpeg/video/reconstruct.c

Copyright © 2021 Plan 9 Foundation.
Distributed under the MIT License.
Download the Plan 9 distribution.


/* 
 *
 *  This file is part of libmpeg3
 *	
 * LibMPEG3
 * Author: Adam Williams <[email protected]>
 * Page: heroine.linuxbox.com
 * Page: http://www.smalltalkconsulting.com/html/mpeg3source.html (for Squeak)
 *
    LibMPEG3 was originally licenced under GPL. It was relicensed by
    the author under the LGPL and the Squeak license on Nov 1st, 2000
    
    This library is free software; you can redistribute it and/or
    modify it under the terms of the GNU Lesser General Public
    License as published by the Free Software Foundation; either
    version 2.1 of the License, or (at your option) any later version.

    This library is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
    Lesser General Public License for more details.

    You should have received a copy of the GNU Lesser General Public
    License along with this library; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
    
    Also licensed under the Squeak license.
    http://www.squeak.org/license.html
 */
#include "mpeg3video.h"
#include <stdio.h>

#ifdef HAVE_MMX

#ifdef HAVE_3Dnow
/*
 * recva_mmx: 3DNow! vertical half-pel prediction averaged into the
 * destination, 16 bytes per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2, %4 = s + lx.
 * Each iteration loads 16 bytes from s and from s + lx, combines them with
 * pavgusb, combines that result with the 16 bytes already at d, and stores
 * it back to d.  All three pointers then advance by lx2.  `loop` decrements
 * ecx and repeats while it is non-zero, so h is expected to be > 0.
 *
 * NOTE(review): the asm modifies registers that are bound as input-only
 * operands, lists no clobbers (memory, flags, mm0-mm3) and is not marked
 * volatile -- check against GCC's extended-asm rules before relying on it
 * with an optimising compiler.
 */
static inline void recva_mmx(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	__asm__(
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		8(%1),	%%mm1\n"      /* 8 s */
	   		"movq		(%4),	%%mm2\n"      /* 8 s +lx */
	   		"movq		8(%4),	%%mm3\n"      /* 8 s +lx **/

			"pavgusb %%mm2, 	%%mm0\n"
			"addl		%3,		%1\n"
			"pavgusb %%mm3, 	%%mm1\n"

	   		"movq		(%2),	%%mm2\n"      /* 8 d */
	   		"movq		8(%2),	%%mm3\n"      /* 8 d */
			"pavgusb %%mm2, 	%%mm0\n"
			"addl		%3,		%4\n"
			"pavgusb %%mm3, 	%%mm1\n"

			"movq		%%mm0,	(%2)\n"
			"movq		%%mm1,	8(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
}

/*
 * recvac_mmx: 8-byte-wide counterpart of recva_mmx.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2, %4 = s + lx.
 * Per row: pavgusb of 8 bytes at s with 8 bytes at s + lx, then pavgusb of
 * that with the 8 bytes at d, stored back to d.  s, s + lx and d advance by
 * lx2; `loop` counts ecx down, so h is expected to be > 0.
 *
 * NOTE(review): input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void recvac_mmx(unsigned char *s, unsigned char *d, int lx,int lx2, int h)
{
	__asm__(
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		(%4),	%%mm2\n"      /* 8 s +lx */
			"addl		%3,		%1\n"
			"pavgusb %%mm2, 	%%mm0\n"
	   		"movq		(%2),	%%mm3\n"      /* 8 d */
			"addl		%3,		%4\n"
			"pavgusb %%mm3, 	%%mm0\n"
			"movq		%%mm0,	(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
}

/*
 * rech_mmx: 3DNow! horizontal half-pel prediction, 16 bytes per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * Per row: the 16 bytes at s are combined (pavgusb) with the 16 bytes at
 * s + 1 and the result overwrites the 16 bytes at d, so 17 source bytes are
 * read per row.  s and d advance by lx2; `loop` counts ecx down, so h is
 * expected to be > 0.
 *
 * NOTE(review): input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void rech_mmx(unsigned char *s, unsigned char *d, int lx2, int h)
{
	__asm__ (
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		8(%1),	%%mm1\n"      /* 8 s */
	   		"movq		1(%1),	%%mm2\n"      /* 8 s */
	   		"movq		9(%1),	%%mm3\n"      /* 8 s */

			"pavgusb 	%%mm2, 	%%mm0\n"
			"addl		%3,		%1\n"
			"pavgusb 	%%mm3, 	%%mm1\n"

			"movq		%%mm0,	(%2)\n"
			"movq		%%mm1,	8(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
}

/*
 * rechc_mmx: 8-byte-wide counterpart of rech_mmx.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * Per row: pavgusb of the 8 bytes at s with the 8 bytes at s + 1, stored to
 * d (9 source bytes read).  s and d advance by lx2; `loop` counts ecx down,
 * so h is expected to be > 0.
 *
 * NOTE(review): input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void rechc_mmx(unsigned char *s, unsigned char *d, int lx2, int h)
{
	__asm__ (
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		1(%1),	%%mm2\n"      /* 8 s +1 */
			"addl		%3,		%1\n"
			"pavgusb 	%%mm2, 	%%mm0\n"
			"movq		%%mm0,	(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
}

/*
 * recha_mmx: 3DNow! horizontal half-pel prediction averaged into the
 * destination, 16 bytes per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * Per row: pavgusb of the bytes at s with the bytes at s + 1, then pavgusb
 * of that with the 16 bytes already at d, stored back to d.  s and d advance
 * by lx2; `loop` counts ecx down, so h is expected to be > 0.
 *
 * NOTE(review): input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void recha_mmx(unsigned char *s, unsigned char *d,int lx2, int h)
{
	__asm__ (
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		8(%1),	%%mm1\n"      /* 8 s */
	   		"movq		1(%1),	%%mm2\n"      /* 8 s */
	   		"movq		9(%1),	%%mm3\n"      /* 8 s */

			"pavgusb 	%%mm2, 	%%mm0\n"
			"addl		%3,		%1\n"
			"pavgusb 	%%mm3, 	%%mm1\n"

	   		"movq		(%2),	%%mm2\n"      /* 8 d */
	   		"movq		8(%2),	%%mm3\n"      /* 8 d */
			"pavgusb 	%%mm2, 	%%mm0\n"
			"pavgusb 	%%mm3, 	%%mm1\n"

			"movq		%%mm0,	(%2)\n"
			"movq		%%mm1,	8(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
}

/*
 * rechac_mmx: 8-byte-wide counterpart of recha_mmx.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * Per row: pavgusb of the 8 bytes at s with the 8 bytes at s + 1, then
 * pavgusb of that with the 8 bytes at d, stored back to d.  s and d advance
 * by lx2; `loop` counts ecx down, so h is expected to be > 0.
 *
 * NOTE(review): input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void rechac_mmx(unsigned char *s,unsigned char  *d, int lx2, int h)
{
	__asm__ (
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		1(%1),	%%mm2\n"      /* 8 s */

			"addl		%3,		%1\n"
			"pavgusb 	%%mm2, 	%%mm0\n"

	   		"movq		(%2),	%%mm1\n"      /* 8 d */
			"pavgusb 	%%mm1, 	%%mm0\n"

			"movq		%%mm0,	(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
}

/*
 * rec4_mmx: 3DNow! diagonal (horizontal + vertical) half-pel prediction,
 * 16 bytes per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2, %4 = s + lx.
 * Before the loop, mm0/mm1 are loaded with the 16 bytes at s and mm2/mm3
 * with the 16 bytes at s + 1; %1 is not touched again.  Each iteration loads
 * the next line (%4 and %4 + 1) into mm4..mm7, folds s+1, next-line and
 * next-line+1 into mm0/mm1 with three successive pavgusb steps, stores the
 * result to d, then moves mm4..mm7 into mm0..mm3 so the line just read
 * becomes the "current" line of the following iteration.  Only %4 and %2
 * advance (by lx2).  `loop` counts ecx down, so h is expected to be > 0.
 *
 * NOTE(review): three cascaded pairwise averages do not weight the four
 * samples equally, so the result can differ from (a+b+c+d+2)>>2 as computed
 * by the C rec4().  Input-only operands are also modified and no clobbers
 * are declared -- check against GCC's extended-asm rules.
 */
static inline void rec4_mmx(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	__asm__ __volatile__(
	   	"movq		(%1),	%%mm0\n"  /* 8 s */
	   	"movq		8(%1),	%%mm1\n"  /* 8 s */
	   	"movq		1(%1),	%%mm2\n"  /* 8 s +1*/
	   	"movq		9(%1),	%%mm3\n"  /* 8 s +1*/
		".align 8\n"
		"1:"
	   		"movq		(%4),	%%mm4\n"  /* 8 s+lx */
			"pavgusb 	%%mm2, 	%%mm0\n"
	   		"movq		8(%4),	%%mm5\n"  /* 8 s+lx */
			"pavgusb 	%%mm3, 	%%mm1\n"

	   		"movq		1(%4),	%%mm6\n"  /* 8 s+lx +1*/
			"pavgusb 	%%mm4, 	%%mm0\n"
	   		"movq		9(%4),	%%mm7\n"  /* 8 s+lx +1*/
			"pavgusb 	%%mm5, 	%%mm1\n"

			"pavgusb 	%%mm6, 	%%mm0\n"
			"addl		%3,		%4\n"
			"pavgusb 	%%mm7, 	%%mm1\n"
			"movq		%%mm0,	(%2)\n"
			"movq		%%mm6,	%%mm2\n"
			"movq		%%mm7,	%%mm3\n"
			"movq		%%mm1,	8(%2)\n"
			"movq		%%mm4,	%%mm0\n"
			"movq		%%mm5,	%%mm1\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      	:
		: "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
}

/*
 * rec4c_mmx: 8-byte-wide counterpart of rec4_mmx.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2, %4 = s + lx.
 * mm0 / mm2 are preloaded with the 8 bytes at s and s + 1.  Each iteration
 * loads the next line (%4, %4 + 1) into mm4 / mm6, folds mm2, mm4 and mm6
 * into mm0 with three successive pavgusb steps, stores mm0 to d and then
 * carries mm4 / mm6 over as the current line.  %4 and %2 advance by lx2;
 * `loop` counts ecx down, so h is expected to be > 0.
 *
 * NOTE(review): cascaded pairwise averaging is not an equal-weight mean of
 * the four samples.  Input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void rec4c_mmx(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	__asm__ __volatile__(
	   	"movq		(%1),	%%mm0\n"  /* 8 s */
	   	"movq		1(%1),	%%mm2\n"  /* 8 s +1*/
		".align 8\n"
		"1:"
	   		"movq		(%4),	%%mm4\n"  /* 8 s+lx */
			"pavgusb 	%%mm2, 	%%mm0\n"

	   		"movq		1(%4),	%%mm6\n"  /* 8 s+lx +1*/
			"pavgusb 	%%mm4, 	%%mm0\n"

			"addl		%3,		%4\n"
			"pavgusb 	%%mm6, 	%%mm0\n"
			"movq		%%mm0,	(%2)\n"
			"movq		%%mm6,	%%mm2\n"
			"movq		%%mm4,	%%mm0\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      	:
		: "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
}

/*
 * rec4a_mmx: 3DNow! diagonal half-pel prediction averaged into the
 * destination, 16 bytes per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2, %4 = s + lx.
 * Same line-carrying scheme as rec4_mmx (current line kept in mm0..mm3, next
 * line loaded into mm4..mm7 each iteration), with the bytes already at d
 * loaded into mm2/mm3 and folded in with an extra pavgusb before the store.
 * %4 and %2 advance by lx2; `loop` counts ecx down, so h is expected > 0.
 *
 * NOTE(review): the two 8-byte halves fold their inputs in different orders:
 * mm0 takes s+lx+1 (mm6) before d (mm2), whereas mm1 takes d (mm3) before
 * s+lx+1 (mm7).  Because pavgusb chains are order-sensitive, the halves may
 * round/weight differently -- confirm whether this is intended.  Input-only
 * operands are also modified and no clobbers are declared.
 */
static inline void rec4a_mmx(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	__asm__ __volatile__(
	   	"movq		(%1),	%%mm0\n"  /* 8 s */
	   	"movq		8(%1),	%%mm1\n"  /* 8 s */
	   	"movq		1(%1),	%%mm2\n"  /* 8 s +1*/
	   	"movq		9(%1),	%%mm3\n"  /* 8 s +1*/
		".align 8\n"
		"1:"
	   		"movq		(%4),	%%mm4\n"  /* 8 s+lx */
			"pavgusb 	%%mm2, 	%%mm0\n"
	   		"movq		8(%4),	%%mm5\n"  /* 8 s+lx */
			"pavgusb 	%%mm3, 	%%mm1\n"

	   		"movq		1(%4),	%%mm6\n"  /* 8 s+lx +1*/
			"pavgusb 	%%mm4, 	%%mm0\n"
	   		"movq		9(%4),	%%mm7\n"  /* 8 s+lx +1*/
			"pavgusb 	%%mm5, 	%%mm1\n"
			"movq		(%2),	%%mm2\n"
			"pavgusb 	%%mm6, 	%%mm0\n"
			"movq		8(%2),	%%mm3\n"

			"pavgusb 	%%mm2, 	%%mm0\n"
			"addl		%3,		%4\n"
			"pavgusb 	%%mm3, 	%%mm1\n"
			"movq		%%mm0,	(%2)\n"

			"pavgusb 	%%mm7, 	%%mm1\n"
			"movq		%%mm6,	%%mm2\n"
			"movq		%%mm7,	%%mm3\n"
			"movq		%%mm1,	8(%2)\n"
			"movq		%%mm4,	%%mm0\n"
			"movq		%%mm5,	%%mm1\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      	:
		: "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
}

/*
 * rec4ac_mmx: 8-byte-wide counterpart of rec4a_mmx.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2, %4 = s + lx.
 * mm0 / mm2 are preloaded with the bytes at s and s + 1.  Each iteration
 * loads the next line (%4, %4 + 1) into mm4 / mm6 and the current contents
 * of d into mm1, folds mm2, mm4, mm6 and mm1 into mm0 with successive
 * pavgusb steps, stores mm0 to d and carries mm4 / mm6 over as the current
 * line.  %4 and %2 advance by lx2; `loop` counts ecx down, so h is expected
 * to be > 0.
 *
 * NOTE(review): input-only operands are modified and no clobbers are
 * declared -- check against GCC's extended-asm rules.
 */
static inline void rec4ac_mmx(unsigned char *s, unsigned char  *d, int lx, int lx2, int h)
{
	__asm__ __volatile__(
	   	"movq		(%1),	%%mm0\n"  /* 8 s */
	   	"movq		1(%1),	%%mm2\n"  /* 8 s +1*/
		".align 8\n"
		"1:"
	   		"movq		(%4),	%%mm4\n"  /* 8 s+lx */
			"pavgusb 	%%mm2, 	%%mm0\n"

	   		"movq		1(%4),	%%mm6\n"  /* 8 s+lx +1*/
			"pavgusb 	%%mm4, 	%%mm0\n"
			"movq		(%2),	%%mm1\n"  /* 8 d */
			"pavgusb 	%%mm6, 	%%mm0\n"
			"addl		%3,		%4\n"
			"pavgusb 	%%mm1, 	%%mm0\n"
			"movq		%%mm6,	%%mm2\n"
			"movq		%%mm0,	(%2)\n"
			"movq		%%mm4,	%%mm0\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      	:
		: "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
}

#else  // HAVE_3DNOW
	/*
	 * Per-byte constants for the plain-MMX (non-3DNow!) averaging loops:
	 * ADD_1 holds 0x01 in every byte, MASK_AND holds 0x7f in every byte.
	 * The asm in this file refers to the symbols _ADD_1 and _MASK_AND by
	 * name; presumably these are the same objects on targets that prefix C
	 * symbols with '_' -- TODO confirm for the target toolchain, and that
	 * the compiler does not discard them as unused.
	 */
	static long long ADD_1	=	0x0101010101010101LL;
	static long long MASK_AND = 0x7f7f7f7f7f7f7f7fLL;
#endif

/*
 * rec_mmx: copy a 16-byte-wide block of h rows from s to d using two 64-bit
 * MMX moves per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * s is advanced with addl, d with leal.  leal does not alter the flags, so
 * the zero flag set by `decl %0` is still valid at the closing jnz.  The
 * body runs before the counter is tested, so h is expected to be > 0.
 *
 * NOTE(review): input-only operands (including ecx) are modified and no
 * clobbers are declared -- check against GCC's extended-asm rules.
 */
static inline void rec_mmx(unsigned char *s, unsigned char *d, int lx2, int h)
{
	__asm__ __volatile__(
		".align 8\n"
		"1:\t"
			"movq ( %1 ),     	%%mm0\n"			/* 8 s */
		    "movq 8( %1 ),    	%%mm2\n"			/* 16 s */
		    "movq %%mm0,  		( %2 )\n"   
			"addl %3,			%1\n"
		    "movq %%mm2,  		8( %2 )\n"   
			"decl %0\n"		
		    "leal (%2, %3), %2\n"
	 	"jnz    1b"            
		: 
		: "c" (h), "r" (s), "r" (d), "r" (lx2)
	);   
}


/*
 * recc_mmx: copy an 8-byte-wide block of h rows from s to d, one 64-bit MMX
 * move per row.
 *
 * Operands: %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * s is advanced with addl, d with leal (which leaves the flags from
 * `decl %0` intact for the closing jnz).  The body runs before the counter
 * is tested, so h is expected to be > 0.
 *
 * NOTE(review): input-only operands (including ecx) are modified and no
 * clobbers are declared -- check against GCC's extended-asm rules.
 */
static inline void recc_mmx(unsigned char *s, unsigned char *d, int lx2, int h)
{
	__asm__ __volatile__(
		".align 8\n"
	    "1:\t"
	    	"movq ( %1 ),     %%mm0\n"
	      	"addl %3,   	  %1\n"
	      	"movq %%mm0,  	  ( %2 )\n"   
			"decl %0\n"
	      	"leal (%2, %3), %2\n"
	   	"jnz    1b"            
		: 
		: "c" (h), "r" (s), "r" (d), "r" (lx2)
	);   
}


/*
 * reca_mmx: average a 16-byte-wide block of h rows from s into d.
 *
 * Operands (both variants): %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * s and d advance by lx2 per row; h is expected to be > 0 because the row
 * body executes before the counter is tested.
 *
 * HAVE_3Dnow: each 8-byte half of s is combined with the matching half of d
 * by pavgusb and written back to d; `loop` drives the row counter.
 *
 * Otherwise (plain MMX): mm5 and mm6 are loaded from the symbols _MASK_AND
 * and _ADD_1.  Every input is shifted right by one as 16-bit words and then
 * ANDed with mm5, the two results are added with paddusb and mm6 is added on
 * top.  NOTE(review): assuming those symbols are the 0x7f.. / 0x01.. byte
 * constants, this yields (s>>1)+(d>>1)+1 per byte, which is not always equal
 * to the rounded average (s+d+1)>>1 computed by the C reca() -- confirm this
 * approximation is acceptable.
 *
 * NOTE(review): neither asm statement is volatile, both modify input-only
 * operands and neither declares clobbers.
 */
static inline void reca_mmx(unsigned char *s, unsigned char  *d, int lx2, int h)
{
#ifdef HAVE_3Dnow
	__asm__ (
		".align	8\n"
		"1:"
		   	"movq		(%1),	%%mm0\n"      /* 8 s */
			"movq		(%2),	%%mm2\n"      /* 8 d */
		   	"movq		8(%1),	%%mm1\n"      /* 8 s */
		   	"movq		8(%2),	%%mm3\n"      /* 8 d */
			"pavgusb 	%%mm2, 	%%mm0\n"
			"addl		%3,		%1\n"
			"pavgusb 	%%mm3, 	%%mm1\n"

			"movq		%%mm0,	(%2)\n"
			"movq		%%mm1,	8(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
		:
		: "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
#else   /* No 3dnow */
	__asm__ (
  		"movq	     _MASK_AND, 	%%mm5\n"
  		"movq	     _ADD_1, 	%%mm6\n"
		"1:\t"
  			"movq        (%1),%%mm0\n"        /* Load 16 pixels from each row */
  			"movq        (%2),%%mm1\n"
  			"movq       8(%1),%%mm2\n"
  			"movq       8(%2),%%mm3\n"
  			"psrlw		$1,%%mm0\n"           /* Shift pixels down */
  			"psrlw	    $1,%%mm1\n"
  			"pand	    %%mm5,%%mm0\n"        /* Zero out significant bit */
  			"psrlw	    $1,%%mm2\n"
  			"pand	    %%mm5,%%mm1\n"
  			"psrlw	    $1,%%mm3\n"
  			"pand	    %%mm5,%%mm2\n"
  			"paddusb    %%mm1,%%mm0\n"        /* Add pixels */
  			"pand	    %%mm5,%%mm3\n"
  			"paddusb    %%mm3,%%mm2\n"
  			"paddusb    %%mm6,%%mm0\n"        /* Add 1 to results */
  			"paddusb    %%mm6,%%mm2\n"
  			"movq       %%mm0,(%2)\n"
  			"addl       %3,%1\n"
  			"movq	    %%mm2, 8(%2)\n"
  			"decl       %0\n"
  			"leal		(%2, %3), %2\n"
  		"jnz        1b\n"
		:
		: "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
#endif
}


/*
 * recac_mmx: 8-byte-wide counterpart of reca_mmx (average s into d).
 *
 * Operands (both variants): %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2.
 * s and d advance by lx2 per row; h is expected to be > 0.
 *
 * HAVE_3Dnow: pavgusb of the 8 bytes at s with the 8 bytes at d, stored back
 * to d, row counter driven by `loop`.
 *
 * Otherwise (plain MMX): both inputs are shifted right by one (psrlw) and
 * ANDed with mm5, added with paddusb, and mm6 is added on top; mm5 / mm6 are
 * loaded from the symbols _MASK_AND / _ADD_1.  NOTE(review): assuming those
 * are the 0x7f.. / 0x01.. byte constants this is (s>>1)+(d>>1)+1, an
 * approximation of the rounded average -- confirm.
 *
 * NOTE(review): neither asm statement is volatile, both modify input-only
 * operands and neither declares clobbers.
 */
static inline void recac_mmx(unsigned char *s, unsigned char *d, int lx2, int h)
{
#ifdef HAVE_3Dnow
	__asm__ (
		".align	8\n"
		"1:"
		   	"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		(%2),	%%mm2\n"      /* 8 d */
			"pavgusb 	%%mm2, 	%%mm0\n"
			"addl		%3,		%1\n"
			"movq		%%mm0,	(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
		:
		: "c" (h), "r" (s), "r" (d), "r" (lx2)
	);
#else /* No 3dnow */
	__asm__ (
  		"movq	     _MASK_AND, 	%%mm5\n"
  		"movq	     _ADD_1, 	%%mm6\n"
		"1:\t"
  			"movq       (%1),%%mm0\n"
  			"movq       (%2),%%mm1\n"
  			"psrlw		$1,%%mm0\n"
  			"psrlw	    $1,%%mm1\n"
  			"pand	    %%mm5,%%mm0\n"
  			"pand	    %%mm5,%%mm1\n"
  			"paddusb    %%mm1,%%mm0\n"
  			"paddusb    %%mm6,%%mm0\n"
  			"addl       %3,%1\n"
  			"movq       %%mm0,(%2)\n"
  			"decl       %0\n"
  			"leal		(%2, %3), %2\n"
  		"jnz        1b\n"
		:
		: "c" (h), "r" (s), "r" (d), "r" (lx2)
		);
#endif
}


/*
 * recv_mmx: vertical half-pel prediction, 16 bytes per row: each output row
 * is formed from the line at s and the line at s + lx and overwrites d.
 *
 * Operands (both variants): %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2,
 * %4 = s + lx.  All three pointers advance by lx2 per row; h is expected to
 * be > 0 because the row body executes before the counter is tested.
 *
 * HAVE_3Dnow: the two lines are combined with pavgusb; `loop` drives the
 * counter.
 *
 * Otherwise (plain MMX): both lines are shifted right by one (psrlw), ANDed
 * with mm5, added with paddusb, and mm6 is added on top; mm5 / mm6 come from
 * the symbols _MASK_AND / _ADD_1.  NOTE(review): assuming those are the
 * 0x7f.. / 0x01.. byte constants this is (a>>1)+(b>>1)+1, an approximation
 * of the rounded average used by the C recv() -- confirm.
 *
 * NOTE(review): neither asm statement is volatile, both modify input-only
 * operands and neither declares clobbers.
 */
static inline void recv_mmx(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
#ifdef HAVE_3Dnow
	__asm__(
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		(%4),	%%mm2\n"      /* 8 s +lx */
	   		"movq		8(%1),	%%mm1\n"      /* 8 s */
	   		"movq		8(%4),	%%mm3\n"      /* 8 s +lx **/

			"pavgusb %%mm2, 	%%mm0\n"
			"addl		%3,		%1\n"
			"pavgusb %%mm3, 	%%mm1\n"

			"movq		%%mm0,	(%2)\n"
			"addl		%3,		%4\n"
			"movq		%%mm1,	8(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
#else
	__asm__ (
  		"movq	     _MASK_AND, 	%%mm5\n"
  		"movq	     _ADD_1, 	%%mm6\n"
		"1:\t"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		(%4),	%%mm1\n"      /* 8 s +lx */
	   		"movq		8(%1),	%%mm2\n"      /* 8 s */
	   		"movq		8(%4),	%%mm3\n"      /* 8 s +lx **/
  			"psrlw      $1,%%mm0\n"
  			"psrlw      $1,%%mm1\n"
  			"pand       %%mm5,%%mm0\n"
  			"psrlw      $1,%%mm2\n"
  			"pand       %%mm5,%%mm1\n"
  			"psrlw      $1,%%mm3\n"
  			"pand       %%mm5,%%mm2\n"
  			"paddusb    %%mm1,%%mm0\n"
  			"pand       %%mm5,%%mm3\n"
  			"paddusb    %%mm3,%%mm2\n"
  			"paddusb    %%mm6,%%mm0\n"
  			"paddusb    %%mm6,%%mm2\n"
  			"movq       %%mm0,(%2)\n"
  			"addl       %3,%1\n"
  			"movq	    %%mm2, 8(%2)\n"
  			"addl       %3,%4\n"
  			"decl       %0\n"
  			"leal		(%2, %3), %2\n"
  		"jnz        1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
#endif
}


/*
 * recvc_mmx: 8-byte-wide counterpart of recv_mmx (vertical half-pel
 * prediction from the lines at s and s + lx, written to d).
 *
 * Operands (both variants): %0 = h (in ecx), %1 = s, %2 = d, %3 = lx2,
 * %4 = s + lx.  All three pointers advance by lx2 per row; h is expected to
 * be > 0.
 *
 * HAVE_3Dnow: the two lines are combined with pavgusb; `loop` drives the
 * counter.  Otherwise the plain-MMX shift/mask/add sequence is used with
 * mm5 / mm6 loaded from the symbols _MASK_AND / _ADD_1.  NOTE(review):
 * assuming those are the 0x7f.. / 0x01.. byte constants the plain-MMX result
 * is (a>>1)+(b>>1)+1, an approximation of the rounded average -- confirm.
 *
 * NOTE(review): neither asm statement is volatile, both modify input-only
 * operands and neither declares clobbers.
 */
static inline void recvc_mmx(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
#ifdef HAVE_3Dnow
	__asm__(
		".align	8\n"
		"1:"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		(%4),	%%mm2\n"      /* 8 s +lx */
			"addl		%3,		%1\n"
			"pavgusb %%mm2, 	%%mm0\n"
			"addl		%3,		%4\n"
			"movq		%%mm0,	(%2)\n"
			"addl		%3,		%2\n"
		"loop		1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
#else
	__asm__ (
  		"movq	     _MASK_AND, 	%%mm5\n"
  		"movq	     _ADD_1, 	%%mm6\n"
		"1:\t"
	   		"movq		(%1),	%%mm0\n"      /* 8 s */
	   		"movq		(%4),	%%mm1\n"      /* 8 s +lx */
  			"psrlw      $1,%%mm0\n"
  			"psrlw      $1,%%mm1\n"
  			"pand       %%mm5,%%mm0\n"
  			"pand       %%mm5,%%mm1\n"
  			"paddusb    %%mm1,%%mm0\n"
  			"addl       %3,%1\n"
  			"paddusb    %%mm6,%%mm0\n"
  			"addl       %3,%4\n"
  			"movq       %%mm0,(%2)\n"
  			"decl       %0\n"
  			"leal		(%2, %3), %2\n"
  		"jnz        1b\n"
      :
      : "c" (h), "r" (s), "r" (d), "r" (lx2), "r" (s +lx)
	);
#endif
}

#endif  // HAVE_MMX

/*
 * rec: copy a 16-byte-wide block of h rows from s to d.
 *
 *   s, d  first byte of the source / destination block
 *   lx2   distance in bytes between consecutive rows (same for s and d)
 *   h     number of rows; nothing is copied when h <= 0
 *
 * The former __POWERPC__ fast path moved four `unsigned long` words per row.
 * That is 32 bytes on LP64 PowerPC (writing 16 bytes past the block) and it
 * accessed the byte buffers through an incompatible, possibly misaligned
 * pointer type.  A plain byte loop is correct on every target and is readily
 * vectorised by the compiler.
 */
static inline void rec(unsigned char *s, unsigned char *d, int lx2, int h)
{
	int j, i;

	for(j = 0; j < h; j++, s += lx2, d += lx2)
	{
		for(i = 0; i < 16; i++)
			d[i] = s[i];
	}
}



/*
 * recc: copy an 8-byte-wide block of h rows from s to d.
 *
 *   s, d  first byte of the source / destination block
 *   lx2   distance in bytes between consecutive rows (same for s and d)
 *   h     number of rows; nothing is copied when h <= 0
 *
 * The former __POWERPC__ fast path moved two `long` words per row.  That is
 * 16 bytes on LP64 PowerPC (writing 8 bytes past the block) and it accessed
 * the byte buffers through an incompatible, possibly misaligned pointer
 * type.  A plain byte loop is correct on every target.
 */
static inline void recc(unsigned char *s, unsigned char *d, int lx2, int h)
{
	int j, i;

	for(j = 0; j < h; j++, s += lx2, d += lx2)
	{
		for(i = 0; i < 8; i++)
			d[i] = s[i];
	}
}

/*
 * reca: blend a 16-byte-wide block of h rows from s into d.
 * Every destination byte becomes the rounded mean (d + s + 1) >> 1.
 * Both pointers step by lx2 bytes from one row to the next.
 */
static inline void reca(unsigned char *s, unsigned char  *d, int lx2, int h)
{
	int row, col;

	for(row = 0; row < h; row++)
	{
		for(col = 0; col < 16; col++)
			d[col] = (unsigned int)(d[col] + s[col] + 1) >> 1;

		s += lx2;
		d += lx2;
	}
}

/*
 * recac: blend an 8-byte-wide block of h rows from s into d.
 * Every destination byte becomes the rounded mean (d + s + 1) >> 1.
 * Both pointers step by lx2 bytes from one row to the next.
 */
static inline void recac(unsigned char *s, unsigned char *d, int lx2, int h)
{
	int row, col;

	for(row = 0; row < h; row++)
	{
		for(col = 0; col < 8; col++)
			d[col] = (unsigned int)(d[col] + s[col] + 1) >> 1;

		s += lx2;
		d += lx2;
	}
}

/*
 * recv: vertical half-pel prediction, 16 bytes per row.
 * Each output byte is the rounded mean of the source byte and the byte lx
 * bytes further on (the line below); the result overwrites d.
 * Source and destination rows are lx2 bytes apart.
 */
static inline void recv(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		for(col = 0; col < 16; col++)
			out[col] = (unsigned int)(upper[col] + lower[col] + 1) >> 1;
	}
}

/*
 * recvc: vertical half-pel prediction, 8 bytes per row.
 * Each output byte is the rounded mean of the source byte and the byte lx
 * bytes further on; the result overwrites d.
 * Source and destination rows are lx2 bytes apart.
 */
static inline void recvc(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		for(col = 0; col < 8; col++)
			out[col] = (unsigned int)(upper[col] + lower[col] + 1) >> 1;
	}
}


/*
 * recva: vertical half-pel prediction blended into the destination,
 * 16 bytes per row.
 * The prediction is the rounded mean of the source byte and the byte lx
 * bytes further on; d then becomes the rounded mean of its old value and
 * that prediction.  Rows are lx2 bytes apart.
 */
static inline void recva(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	unsigned int pred;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		for(col = 0; col < 16; col++)
		{
			pred = (unsigned int)(upper[col] + lower[col] + 1) >> 1;
			out[col] = (out[col] + pred + 1) >> 1;
		}
	}
}


/*
 * recvac: vertical half-pel prediction blended into the destination,
 * 8 bytes per row.
 * The prediction is the rounded mean of the source byte and the byte lx
 * bytes further on; d then becomes the rounded mean of its old value and
 * that prediction.  Rows are lx2 bytes apart.
 */
static inline void recvac(unsigned char *s, unsigned char *d, int lx,int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	unsigned int pred;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		for(col = 0; col < 8; col++)
		{
			pred = (unsigned int)(upper[col] + lower[col] + 1) >> 1;
			out[col] = (out[col] + pred + 1) >> 1;
		}
	}
}


/*
 * rech: horizontal half-pel prediction, 16 bytes per row.
 * Output byte i is the rounded mean of source bytes i and i + 1, so 17
 * source bytes are read per row.  Each source byte is fetched once and
 * carried over to the next column.  Rows are lx2 bytes apart.
 */
static inline void rech(unsigned char *s, unsigned char *d, int lx2, int h)
{
	unsigned char *in = s;
	unsigned char *out = d;
	unsigned int left, right;
	int row, col;

	for(row = 0; row < h; row++, in += lx2, out += lx2)
	{
		left = in[0];
		for(col = 0; col < 16; col++)
		{
			right = in[col + 1];
			out[col] = (unsigned int)(left + right + 1) >> 1;
			left = right;
		}
	}
}


/*
 * rechc: horizontal half-pel prediction, 8 bytes per row.
 * Output byte i is the rounded mean of source bytes i and i + 1, so 9 source
 * bytes are read per row.  Each source byte is fetched once and carried over
 * to the next column.  Rows are lx2 bytes apart.
 */
static inline void rechc(unsigned char *s,unsigned char *d, int lx2, int h)
{
	unsigned char *in = s;
	unsigned char *out = d;
	unsigned int left, right;
	int row, col;

	for(row = 0; row < h; row++, in += lx2, out += lx2)
	{
		left = in[0];
		for(col = 0; col < 8; col++)
		{
			right = in[col + 1];
			out[col] = (unsigned int)(left + right + 1) >> 1;
			left = right;
		}
	}
}

/*
 * recha: horizontal half-pel prediction blended into the destination,
 * 16 bytes per row.
 * The prediction for column i is the rounded mean of source bytes i and
 * i + 1; d[i] then becomes the rounded mean of its old value and that
 * prediction.  Rows are lx2 bytes apart.
 */
static inline void recha(unsigned char *s, unsigned char *d,int lx2, int h)
{
	unsigned char *in = s;
	unsigned char *out = d;
	unsigned int left, right, pred;
	int row, col;

	for(row = 0; row < h; row++, in += lx2, out += lx2)
	{
		left = in[0];
		for(col = 0; col < 16; col++)
		{
			right = in[col + 1];
			pred = (unsigned int)(left + right + 1) >> 1;
			out[col] = (out[col] + pred + 1) >> 1;
			left = right;
		}
	}
}


/*
 * rechac: horizontal half-pel prediction blended into the destination,
 * 8 bytes per row.
 * The prediction for column i is the rounded mean of source bytes i and
 * i + 1; d[i] then becomes the rounded mean of its old value and that
 * prediction.  Rows are lx2 bytes apart.
 */
static inline void rechac(unsigned char *s,unsigned char  *d, int lx2, int h)
{
	unsigned char *in = s;
	unsigned char *out = d;
	unsigned int left, right, pred;
	int row, col;

	for(row = 0; row < h; row++, in += lx2, out += lx2)
	{
		left = in[0];
		for(col = 0; col < 8; col++)
		{
			right = in[col + 1];
			pred = (unsigned int)(left + right + 1) >> 1;
			out[col] = (out[col] + pred + 1) >> 1;
			left = right;
		}
	}
}


/*
 * rec4: diagonal (horizontal + vertical) half-pel prediction, 16 bytes per
 * row.
 * Output byte i is (a + b + c + e + 2) >> 2 over the 2x2 neighbourhood made
 * of source bytes i and i + 1 on the current line and on the line lx bytes
 * further on.  Each source byte is fetched once and carried to the next
 * column.  Rows are lx2 bytes apart.
 */
static inline void rec4(unsigned char *s, unsigned char *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	unsigned int ul, ur, ll, lr;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		ul = upper[0];
		ll = lower[0];
		for(col = 0; col < 16; col++)
		{
			ur = upper[col + 1];
			lr = lower[col + 1];
			out[col] = (unsigned int)(ul + ur + ll + lr + 2) >> 2;
			ul = ur;
			ll = lr;
		}
	}
}


/*
 * rec4c: diagonal (horizontal + vertical) half-pel prediction, 8 bytes per
 * row.
 * Output byte i is (a + b + c + e + 2) >> 2 over the 2x2 neighbourhood made
 * of source bytes i and i + 1 on the current line and on the line lx bytes
 * further on.  Rows are lx2 bytes apart.
 */
static inline void rec4c(unsigned char *s,unsigned char *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	unsigned int ul, ur, ll, lr;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		ul = upper[0];
		ll = lower[0];
		for(col = 0; col < 8; col++)
		{
			ur = upper[col + 1];
			lr = lower[col + 1];
			out[col] = (unsigned int)(ul + ur + ll + lr + 2) >> 2;
			ul = ur;
			ll = lr;
		}
	}
}


/*
 * rec4a: diagonal half-pel prediction blended into the destination,
 * 16 bytes per row.
 * The prediction for column i is (a + b + c + e + 2) >> 2 over source bytes
 * i and i + 1 on the current line and on the line lx bytes further on;
 * d[i] then becomes the rounded mean of its old value and that prediction.
 * Rows are lx2 bytes apart.
 */
static inline void rec4a(unsigned char *s,unsigned char *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	unsigned int ul, ur, ll, lr, pred;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		ul = upper[0];
		ll = lower[0];
		for(col = 0; col < 16; col++)
		{
			ur = upper[col + 1];
			lr = lower[col + 1];
			pred = (unsigned int)(ul + ur + ll + lr + 2) >> 2;
			out[col] = (out[col] + pred + 1) >> 1;
			ul = ur;
			ll = lr;
		}
	}
}


/*
 * rec4ac: diagonal half-pel prediction blended into the destination,
 * 8 bytes per row.
 * The prediction for column i is (a + b + c + e + 2) >> 2 over source bytes
 * i and i + 1 on the current line and on the line lx bytes further on;
 * d[i] then becomes the rounded mean of its old value and that prediction.
 * Rows are lx2 bytes apart.
 */
static inline void rec4ac(unsigned char *s,unsigned char  *d, int lx, int lx2, int h)
{
	unsigned char *upper = s;
	unsigned char *lower = s + lx;
	unsigned char *out = d;
	unsigned int ul, ur, ll, lr, pred;
	int row, col;

	for(row = 0; row < h; row++, upper += lx2, lower += lx2, out += lx2)
	{
		ul = upper[0];
		ll = lower[0];
		for(col = 0; col < 8; col++)
		{
			ur = upper[col + 1];
			lr = lower[col + 1];
			pred = (unsigned int)(ul + ur + ll + lr + 2) >> 2;
			out[col] = (out[col] + pred + 1) >> 1;
			ul = ur;
			ll = lr;
		}
	}
}

/*
 * recon_comp: form the prediction for one colour component of one block.
 *
 * A 4-bit mode selects the kernel:
 *   bit 3  dx is odd  (horizontal half-pel)
 *   bit 2  dy is odd  (vertical half-pel)
 *   bit 1  addflag    (average into dst instead of overwriting it)
 *   bit 0  w          (1: 16-byte-wide kernel, 0: 8-byte-wide kernel)
 *
 * src / dst are the component planes, lx the multiplier used to locate row
 * y, lx2 the row step handed to the kernel, (x, y) the block origin and
 * (dx, dy) the motion vector in half-pel units.
 */
static inline
void recon_comp(mpeg3video_t *video, 
		unsigned char *src, 
		unsigned char *dst, 
		int lx, 
		int lx2,
		int w, 
		int h, 
		int x, 
		int y, 
		int dx, 
		int dy, 
		int addflag)
{
	unsigned char *from, *to;
	int mode;

/* Build the kernel selector from the half-pel bits, the add flag and w */
	mode = w;
	if(dx & 1) mode |= 0x8;
	if(dy & 1) mode |= 0x4;
	if(addflag) mode |= 0x2;

/* Full-pel origin of the reference block and of the destination block */
	from = src + lx * (y + (dy >> 1)) + x + (dx >> 1);
	to = dst + lx * y + x;

/* Kernels that always run as plain C, whether or not MMX is in use */
	switch(mode)
	{
		case 0x6:	recvac(from, to, lx, lx2, h); return;
		case 0x7:	recva(from, to, lx, lx2, h);  return;
		case 0x8:	rechc(from, to, lx2, h);      return;
		case 0x9:	rech(from, to, lx2, h);       return;
		case 0xa:	rechac(from, to, lx2, h);     return;
		case 0xb:	recha(from, to, lx2, h);      return;
		case 0xc:	rec4c(from, to, lx, lx2, h);  return;
		case 0xd:	rec4(from, to, lx, lx2, h);   return;
		case 0xe:	rec4ac(from, to, lx, lx2, h); return;
		case 0xf:	rec4a(from, to, lx, lx2, h);  return;
	}

/* Remaining modes 0x0..0x5 have an MMX kernel when it is available */
#ifdef HAVE_MMX
	if(video->have_mmx)
	{
		switch(mode)
		{
			case 0x0:	recc_mmx(from, to, lx2, h);      break;
			case 0x1:	rec_mmx(from, to, lx2, h);       break;
			case 0x2:	recac_mmx(from, to, lx2, h);     break;
			case 0x3:	reca_mmx(from, to, lx2, h);      break;
			case 0x4:	recvc_mmx(from, to, lx, lx2, h); break;
			case 0x5:	recv_mmx(from, to, lx, lx2, h);  break;
		}
		return;
	}
#endif

	switch(mode)
	{
		case 0x0:	recc(from, to, lx2, h);      break;
		case 0x1:	rec(from, to, lx2, h);       break;
		case 0x2:	recac(from, to, lx2, h);     break;
		case 0x3:	reca(from, to, lx2, h);      break;
		case 0x4:	recvc(from, to, lx, lx2, h); break;
		case 0x5:	recv(from, to, lx, lx2, h);  break;
	}
}

/*
	unsigned char *src[]; * prediction source buffer *
	int sfield;           * prediction source field number (0 or 1) *
	unsigned char *dst[]; * prediction destination buffer *
	int dfield;           * prediction destination field number (0 or 1)*
	int lx,lx2;           * horizontal offsets *
	int w,h;              * prediction block/sub-block width, height *
	int x,y;              * pixel co-ordinates of top-left sample in current MB *
	int dx,dy;            * horizontal, vertical motion vector *
	int addflag;          * add prediction error to prediction ? *
*/
/*
 * recon: form the prediction for all three components (Y, Cb, Cr) of one
 * block by calling recon_comp() once per plane.
 *
 * When sfield / dfield is non-zero, the source / destination plane pointer
 * is offset by lx2 >> 1 bytes.  After the luma call the geometry is scaled
 * for chroma: horizontally (lx, lx2, x, dx halved and w forced to 0) unless
 * the stream is CHROMA444, and vertically (h, y, dy halved) when it is
 * CHROMA420.
 */
static void recon(mpeg3video_t *video, 
		unsigned char *src[], 
		int sfield, 
	    unsigned char *dst[], 
		int dfield, 
		int lx,
		int lx2,
	    int w, 
		int h, 
		int x, 
		int y, 
		int dx, 
		int dy, 
		int addflag)
{
	int plane;
	int src_skip, dst_skip;

/* Y */
	src_skip = sfield ? (lx2 >> 1) : 0;
	dst_skip = dfield ? (lx2 >> 1) : 0;
	recon_comp(video, src[0] + src_skip, dst[0] + dst_skip,
		lx, lx2, w, h, x, y, dx, dy, addflag);

/* Horizontal chroma subsampling (everything except 4:4:4) */
	if(video->chroma_format != CHROMA444)
	{
		lx >>= 1;
		lx2 >>= 1;
		x >>= 1;
		dx /= 2;
		w = 0;
	}

/* Vertical chroma subsampling (4:2:0 only) */
	if(video->chroma_format == CHROMA420)
	{
		h >>= 1;
		y >>= 1;
		dy /= 2;
	}

/* Cb, then Cr; the field offsets follow the possibly halved lx2 */
	src_skip = sfield ? (lx2 >> 1) : 0;
	dst_skip = dfield ? (lx2 >> 1) : 0;
	for(plane = 1; plane <= 2; plane++)
	{
		recon_comp(video, src[plane] + src_skip, dst[plane] + dst_skip,
			lx, lx2, w, h, x, y, dx, dy, addflag);
	}
}

#define WIDTH 1

/*
 * mpeg3video_reconstruct: form the motion-compensated prediction for one
 * macroblock by issuing the appropriate recon() calls into video->newframe.
 *
 *	video         decoder state (picture structure/type, frame buffers,
 *	              coded picture width)
 *	bx, by        passed to recon() as the x, y position of the macroblock
 *	mb_type       macroblock flags; MB_FORWARD and MB_BACKWARD are tested
 *	motion_type   MC_FRAME, MC_FIELD, MC_16X8 or MC_DMV; any other value
 *	              is silently ignored
 *	PMV           motion vectors, indexed [vector][forward=0/backward=1][x=0/y=1]
 *	mv_field_sel  source field selectors, indexed [vector][forward=0/backward=1]
 *	dmvector      differential vector handed to mpeg3video_calc_dmv()
 *	stwtype       combined weight code: stwtype % 3 applies to the top
 *	              field, stwtype / 3 to the bottom field
 *	              (0: temporal, 1: (spat+temp) / 2, 2: spatial)
 *
 * Always returns 0.
 */
int mpeg3video_reconstruct(mpeg3video_t *video, 
	int bx, 
	int by, 
	int mb_type, 
	int motion_type,
	int PMV[2][2][2], 
	int mv_field_sel[2][2], 
	int dmvector[2], 
	int stwtype)
{
	/* The lx / lx2 values handed to recon(): picture width and twice that. */
	const int frame_pitch = video->coded_picture_width;
	const int field_pitch = video->coded_picture_width << 1;
	/* Frame buffers used as prediction sources and as destination. */
	unsigned char **old_ref_frame = video->oldrefframe;
	unsigned char **ref_frame = video->refframe;
	unsigned char **out_frame = video->newframe;
	const int is_frame_picture = (video->pict_struct == FRAME_PICTURE);
	const int has_forward = (mb_type & MB_FORWARD) != 0;
	unsigned char **source;
	int parity;
	int DMV[2][2];
	int stwtop, stwbot;

	/* 0:temporal, 1 : (spat+temp) / 2, 2 : spatial */
	stwtop = stwtype % 3;
	stwbot = stwtype / 3;

	/* ---- forward prediction (always performed in P pictures) ---- */
	if(has_forward || video->pict_type == P_TYPE)
	{
		if(is_frame_picture)
		{
			if(motion_type == MC_FRAME || !has_forward)
			{
				/* frame-based prediction, one call per field */
				if(stwtop < 2)
				{
					recon(video, old_ref_frame, 0, out_frame, 0,
						frame_pitch, field_pitch, WIDTH, 8, bx, by,
						PMV[0][0][0], PMV[0][0][1], stwtop);
				}

				if(stwbot < 2)
				{
					recon(video, old_ref_frame, 1, out_frame, 1,
						frame_pitch, field_pitch, WIDTH, 8, bx, by,
						PMV[0][0][0], PMV[0][0][1], stwbot);
				}
			}
			else if(motion_type == MC_FIELD)
			{
				/* field-based prediction: top field */
				if(stwtop < 2)
				{
					recon(video, old_ref_frame, mv_field_sel[0][0], out_frame, 0,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						PMV[0][0][0], PMV[0][0][1] >> 1, stwtop);
				}

				/* field-based prediction: bottom field */
				if(stwbot < 2)
				{
					recon(video, old_ref_frame, mv_field_sel[1][0], out_frame, 1,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						PMV[1][0][0], PMV[1][0][1] >> 1, stwbot);
				}
			}
			else if(motion_type == MC_DMV)
			{
				/* dual prime prediction: derive the extra vectors first */
				mpeg3video_calc_dmv(video, DMV, dmvector,
					PMV[0][0][0], PMV[0][0][1] >> 1);

				if(stwtop < 2)
				{
					/* top field from top field */
					recon(video, old_ref_frame, 0, out_frame, 0,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						PMV[0][0][0], PMV[0][0][1] >> 1, 0);

					/* then add the prediction from the bottom field */
					recon(video, old_ref_frame, 1, out_frame, 0,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						DMV[0][0], DMV[0][1], 1);
				}

				if(stwbot < 2)
				{
					/* bottom field from bottom field */
					recon(video, old_ref_frame, 1, out_frame, 1,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						PMV[0][0][0], PMV[0][0][1] >> 1, 0);

					/* then add the prediction from the top field */
					recon(video, old_ref_frame, 0, out_frame, 1,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						DMV[1][0], DMV[1][1], 1);
				}
			}
			/* any other motion_type is invalid and deliberately ignored */
		}
		else
		{
			/* field picture: TOP_FIELD or BOTTOM_FIELD */
			parity = (video->pict_struct == BOTTOM_FIELD);

			/*
			 * The second field of a P picture predicting from the opposite
			 * parity reads from the same frame; everything else reads from
			 * the previous frame.
			 */
			if(video->pict_type == P_TYPE && video->secondfield &&
				parity != mv_field_sel[0][0])
			{
				source = ref_frame;
			}
			else
			{
				source = old_ref_frame;
			}

			if(motion_type == MC_FIELD || !has_forward)
			{
				/* field-based prediction of the whole macroblock */
				if(stwtop < 2)
				{
					recon(video, source, mv_field_sel[0][0], out_frame, 0,
						field_pitch, field_pitch, WIDTH, 16, bx, by,
						PMV[0][0][0], PMV[0][0][1], stwtop);
				}
			}
			else if(motion_type == MC_16X8)
			{
				if(stwtop < 2)
				{
					/* upper half */
					recon(video, source, mv_field_sel[0][0], out_frame, 0,
						field_pitch, field_pitch, WIDTH, 8, bx, by,
						PMV[0][0][0], PMV[0][0][1], stwtop);

					/* the lower half selects its source frame independently */
					if(video->pict_type == P_TYPE && video->secondfield &&
						parity != mv_field_sel[1][0])
					{
						source = ref_frame;
					}
					else
					{
						source = old_ref_frame;
					}

					/* lower half */
					recon(video, source, mv_field_sel[1][0], out_frame, 0,
						field_pitch, field_pitch, WIDTH, 8, bx, by + 8,
						PMV[1][0][0], PMV[1][0][1], stwtop);
				}
			}
			else if(motion_type == MC_DMV)
			{
				/* dual prime: opposite parity comes from the same frame
				   once the first field has been decoded */
				source = video->secondfield ? ref_frame : old_ref_frame;

				mpeg3video_calc_dmv(video, DMV, dmvector,
					PMV[0][0][0], PMV[0][0][1]);

				/* same parity */
				recon(video, old_ref_frame, parity, out_frame, 0,
					field_pitch, field_pitch, WIDTH, 16, bx, by,
					PMV[0][0][0], PMV[0][0][1], 0);

				/* opposite parity, added to the above */
				recon(video, source, !parity, out_frame, 0,
					field_pitch, field_pitch, WIDTH, 16, bx, by,
					DMV[0][0], DMV[0][1], 1);
			}
			/* any other motion_type is invalid and deliberately ignored */
		}

		/* Any backward prediction below is now passed 1 as its add flag. */
		stwtop = stwbot = 1;
	}

	/* ---- backward prediction ---- */
	if(mb_type & MB_BACKWARD)
	{
		if(is_frame_picture)
		{
			if(motion_type == MC_FRAME)
			{
				/* frame-based prediction, one call per field */
				if(stwtop < 2)
				{
					recon(video, ref_frame, 0, out_frame, 0,
						frame_pitch, field_pitch, WIDTH, 8, bx, by,
						PMV[0][1][0], PMV[0][1][1], stwtop);
				}

				if(stwbot < 2)
				{
					recon(video, ref_frame, 1, out_frame, 1,
						frame_pitch, field_pitch, WIDTH, 8, bx, by,
						PMV[0][1][0], PMV[0][1][1], stwbot);
				}
			}
			else
			{
				/* field-based prediction: top field */
				if(stwtop < 2)
				{
					recon(video, ref_frame, mv_field_sel[0][1], out_frame, 0,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						PMV[0][1][0], PMV[0][1][1] >> 1, stwtop);
				}

				/* field-based prediction: bottom field */
				if(stwbot < 2)
				{
					recon(video, ref_frame, mv_field_sel[1][1], out_frame, 1,
						field_pitch, field_pitch, WIDTH, 8, bx, by >> 1,
						PMV[1][1][0], PMV[1][1][1] >> 1, stwbot);
				}
			}
		}
		else if(motion_type == MC_FIELD)
		{
			/* field picture, field-based prediction */
			recon(video, ref_frame, mv_field_sel[0][1], out_frame, 0,
				field_pitch, field_pitch, WIDTH, 16, bx, by,
				PMV[0][1][0], PMV[0][1][1], stwtop);
		}
		else if(motion_type == MC_16X8)
		{
			/* field picture, upper half then lower half */
			recon(video, ref_frame, mv_field_sel[0][1], out_frame, 0,
				field_pitch, field_pitch, WIDTH, 8, bx, by,
				PMV[0][1][0], PMV[0][1][1], stwtop);

			recon(video, ref_frame, mv_field_sel[1][1], out_frame, 0,
				field_pitch, field_pitch, WIDTH, 8, bx, by + 8,
				PMV[1][1][0], PMV[1][1][1], stwtop);
		}
		/* any other motion_type is invalid and deliberately ignored */
	}

	return 0;
}



/*
 * Bell Labs OSI certified Powered by Plan 9
 *
 * (Return to Plan 9 Home Page)
 *
 * Copyright © 2021 Plan 9 Foundation. All Rights Reserved.
 * Comments to [email protected].
 */