y2touy.asm
上传用户:zhongxx05
上传日期:2007-06-06
资源大小:33641k
文件大小:6k
- ;
- ; ***** BEGIN LICENSE BLOCK *****
- ; Version: RCSL 1.0/RPSL 1.0
- ;
- ; Portions Copyright (c) 1995-2002 RealNetworks, Inc. All Rights Reserved.
- ;
- ; The contents of this file, and the files included with this file, are
- ; subject to the current version of the RealNetworks Public Source License
- ; Version 1.0 (the "RPSL") available at
- ; http://www.helixcommunity.org/content/rpsl unless you have licensed
- ; the file under the RealNetworks Community Source License Version 1.0
- ; (the "RCSL") available at http://www.helixcommunity.org/content/rcsl,
- ; in which case the RCSL will apply. You may also obtain the license terms
- ; directly from RealNetworks. You may not use this file except in
- ; compliance with the RPSL or, if you have a valid RCSL with RealNetworks
- ; applicable to this file, the RCSL. Please see the applicable RPSL or
- ; RCSL for the rights, obligations and limitations governing use of the
- ; contents of the file.
- ;
- ; This file is part of the Helix DNA Technology. RealNetworks is the
- ; developer of the Original Code and owns the copyrights in the portions
- ; it created.
- ;
- ; This file, and the files included with this file, is distributed and made
- ; available on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
- ; EXPRESS OR IMPLIED, AND REALNETWORKS HEREBY DISCLAIMS ALL SUCH WARRANTIES,
- ; INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, FITNESS
- ; FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
- ;
- ; Technology Compatibility Kit Test Suite(s) Location:
- ; http://www.helixcommunity.org/content/tck
- ;
- ; Contributor(s):
- ;
- ; ***** END LICENSE BLOCK *****
- ;
- ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
- ;;
- ;; YUY2 to UYVY MMX converter.
- ;;
- ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
- %ifdef COFF
- %define YUY2ToUYVY_MMX _YUY2ToUYVY_MMX
- %elifdef WIN32
- %define YUY2ToUYVY_MMX _YUY2ToUYVY_MMX
- %elifdef ELF
- %define YUY2ToUYVY_MMX YUY2ToUYVY_MMX
- %elifdef AOUTB
- %define YUY2ToUYVY_MMX YUY2ToUYVY_MMX
- %else
- %error linking format currently not supported by alphbablend.asm
- %endif
- ;; Export the functions implemented here.
- global YUY2ToUYVY_MMX
- ;========================= DATA SEGMENT ============================
- section .data
- align 8
- ;============================= CODE SEGMENT =======================
- section .text
- ;;
- ;; This is our stack params definition. It is used for both
- ;; YUY2 and UYVY routines as they both take the same parms.
- ;;
- %assign numtemps 4
- %define var(a) [esp+a]
-
- struc parms
- ;Temps on stack
- .tmp1 resd 1 ;General DWORD temp.
- .tmp2 resd 1 ;General DWORD temp.
- .tmp3 resd 1 ;General DWORD temp.
- .tmp4 resd 1 ;General DWORD temp.
-
- ; Space for reg pushes and return address.
- .registers resd 6 ;pushed registers
- .return resd 1 ;return address
- ; input params
- .src: resd 1 ;unsigned char*,
- .dest: resd 1 ;unsigned char*,
- .dx: resd 1 ;ULONG32,
- endstruc
- YUY2ToUYVY_MMX:
- ;; Save some stuff...
- push ebx
- push edi
- push esi
- push ebp
- push ecx
- push edx
- ; Make room for temps on stack
- sub esp, numtemps*4;
- ;; Grab source and dest pointers...
- mov esi, var(parms.src)
- mov edi, var(parms.dest)
- ;; Preload our address add constant
- mov edx, 8
-
- mov ecx, var(parms.dx)
- shr ecx, 3 ; we do 4 macro pixels at a time.
- jnc loop1 ; Do we have a width that is a multiple of 8?
- ;; We have 2 macro pixels left over. Do them here
-
- movq mm0, [esi] ; grab 2 macro pixels from source
- movq mm1, mm0 ; mm1=mm0= VVYYUUYY VVYYUUYY
- psllw mm1, 8 ; mm1 = YY00YY00 YY00YY00
- psrlw mm0, 8 ; mm0 = 00VV00UU 00VV00UU
- por mm0, mm1 ; mm0 = YYVVYYUU YYVVYYUU
- movq [edi], mm0 ; store it.
- add esi, edx
- add edi, edx
- ;; This loops does 16 bytes at a time (4 macro pixels).
- loop1:
- movq mm0, [esi] ; grab 2 macro pixels from source
- add esi, edx
- movq mm1, mm0 ; mm1=mm0= VVYYUUYY VVYYUUYY
- psllw mm1, 8 ; mm1 = YY00YY00 YY00YY00
- psrlw mm0, 8 ; mm0 = 00VV00UU 00VV00UU
- movq mm2, [esi] ; grab 2 macro pixels from source
- por mm0, mm1 ; mm0 = YYVVYYUU YYVVYYUU
- movq mm3, mm2 ; mm1=mm0= VVYYUUYY VVYYUUYY
-
- movq [edi], mm0 ; store it.
- add edi, edx
- psllw mm3, 8 ; mm1 = YY00YY00 YY00YY00
- psrlw mm2, 8 ; mm0 = 00VV00UU 00VV00UU
- por mm2, mm3 ; mm0 = YYVVYYUU YYVVYYUU
- add esi, edx
-
- movq [edi], mm2 ; store it.
-
- ;; Now do the loop calcs....
- add edi, edx
- dec ecx
- jnz loop1
-
- end:
- ;; Free up stack temp var.
- add esp, numtemps*4
-
- ;; Pop off the stack....
- pop edx
- pop ecx
- pop ebp
- pop esi
- pop edi
- pop ebx
- ;; This emms is expensive. If we don't do it we wipe out the
- ;; floating ponts registers but that should be ok.
- ; emms
-
- ;; success
- xor eax, eax
- ret
- ;;; leave a trace
- version: db '$(gfw) Copyright 2001 RealNetworks Inc. Revision:1.0 $',0