2020-09-30 16:53:55 +02:00

872 lines
24 KiB
NASM

;* *************************************************************************
;* INTEL Corporation Proprietary Information
;*
;* This listing is supplied under the terms of a license
;* agreement with INTEL Corporation and may not be copied
;* nor disclosed except in accordance with the terms of
;* that agreement.
;*
;* Copyright (c) 1995 Intel Corporation.
;* All Rights Reserved.
;*
;* *************************************************************************
;* -------------------------------------------------------------------------
;* PVCS Source control information:
;*
;* $Header: S:\h26x\src\dec\dx5aspec.asv 1.2 01 Sep 1995 17:12:12 DBRUCKS $
;*
;* $Log: S:\h26x\src\dec\dx5aspec.asv $
;//
;// Rev 1.2 01 Sep 1995 17:12:12 DBRUCKS
;// fix shaping
;//
;// Rev 1.1 29 Aug 1995 16:49:02 DBRUCKS
;// cleanup comment
;//
;// Rev 1.0 23 Aug 1995 12:20:32 DBRUCKS
;// Initial revision.
;*
;* NOTE:
;* The starting source for this routine came from the PVCS database
;* for the H261 decoder (aspeccor.asm version 1.1, which is a working
;* 16-bit version).
;* -------------------------------------------------------------------------
;////////////////////////////////////////////////////////////////////////////
; AspectCorrect -- This function converts the U & V data from 8 bits to 7 bits
; and moves the data into the YVU9 format the MRV color
; convertors want. Note: the Y data was already converted
; from 8 bits to 7 bits in Convert_Y_8to7_Bit.
;
; if (Input Format == YVU9)
; /* This is needed for looking glass output */
; copy U and V from src to dst
; else { /* Input Format == YVU12 */
; if (shaping) {
; copy Y from src to dst skiping every 12th line
; copy UV from src to dst subsampling and dropping one in 12 lines
; (although not every 12th).
; } else {
; copy UV from src to dst subsampling
; }
; }
;
; Notes:
; * the MRV color converters expect YVU9
; * we may need to drop every 12th line for aspect ratio correction of the
; YVU12 input.
;
; ASSUMPTIONS/LIMITATIONS:
; * IF input in YVU12, only 128x96, 176x144, & 352x288 resolutions are
; supported. YVU9 should support all sizes.
;
;-------------------------------------------------------------------------------
include decconst.inc
ifndef WIN32
.MODEL SMALL
endif
.486
ifdef WIN32
.MODEL FLAT
.DATA
else ;; WIN16
_DATA SEGMENT PUBLIC 'DATA'
endif
;; Toss lines for aspect ratio correction 12 to 9
;; 6, 19, 30, 43, 54, 67,
;; 78, 91,102,115,126,139
;; Lookup Table for 8->7 bit conversion and clamping.
;; U and V range from 16..240->8..120
gTAB_UVtbl8to7 BYTE 8, 8, 8, 8, 8, 8, 8, 8
BYTE 8, 8, 8, 8, 8, 8, 8, 8
BYTE 8, 8, 9, 9, 10, 10, 11, 11
BYTE 12, 12, 13, 13, 14, 14, 15, 15
BYTE 16, 16, 17, 17, 18, 18, 19, 19
BYTE 20, 20, 21, 21, 22, 22, 23, 23
BYTE 24, 24, 25, 25, 26, 26, 27, 27
BYTE 28, 28, 29, 29, 30, 30, 31, 31
BYTE 32, 32, 33, 33, 34, 34, 35, 35
BYTE 36, 36, 37, 37, 38, 38, 39, 39
BYTE 40, 40, 41, 41, 42, 42, 43, 43
BYTE 44, 44, 45, 45, 46, 46, 47, 47
BYTE 48, 48, 49, 49, 50, 50, 51, 51
BYTE 52, 52, 53, 53, 54, 54, 55, 55
BYTE 56, 56, 57, 57, 58, 58, 59, 59
BYTE 60, 60, 61, 61, 62, 62, 63, 63
BYTE 64, 64, 65, 65, 66, 66, 67, 67
BYTE 68, 68, 69, 69, 70, 70, 71, 71
BYTE 72, 72, 73, 73, 74, 74, 75, 75
BYTE 76, 76, 77, 77, 78, 78, 79, 79
BYTE 80, 80, 81, 81, 82, 82, 83, 83
BYTE 84, 84, 85, 85, 86, 86, 87, 87
BYTE 88, 88, 89, 89, 90, 90, 91, 91
BYTE 92, 92, 93, 93, 94, 94, 95, 95
BYTE 96, 96, 97, 97, 98, 98, 99, 99
BYTE 100,100,101,101,102,102,103,103
BYTE 104,104,105,105,106,106,107,107
BYTE 108,108,109,109,110,110,111,111
BYTE 112,112,113,113,114,114,115,115
BYTE 116,116,117,117,118,118,119,119
BYTE 120,120,120,120,120,120,120,120
BYTE 120,120,120,120,120,120,120,120
_DATA ENDS
ifdef WIN32
.CODE
assume cs : flat
assume ds : flat
assume es : flat
assume fs : flat
assume gs : flat
else
_TEXT32 SEGMENT PUBLIC READONLY USE32 'CODE'
ASSUME DS:_DATA
ASSUME CS:_TEXT32
ASSUME ES:nothing
ASSUME FS:nothing
ASSUME GS:nothing
endif
;C function prototype
;
;long AspectCorrect(
; HPBYTE pYPlaneInput, /*ptr Y plane*/
; HPBYTE pVPlaneInput, /*ptr V plane*/
; HPBYTE pUPlaneInput, /*ptr U plane*/
; DWORD YResolution, /*Y plane height*/
; DWORD XResolution, /*Y plane width*/
; WORD far * pyNewHeight, /*Pitch of Y plane in*/
; DWORD YVU9InputFlag, /*flag = YUV9 or YUV12*/
; HPBYTE pYPlaneOutput, /*pYOut*/
; HPBYTE pVPlaneOutput, /*pUOut*/
; DWORD YPitchOut, /*Pitch of Y plane out*/
; DWORD ShapingFlag /*flag = Shaping or not*/
; )
PUBLIC _AspectCorrect
ifdef WIN32
_AspectCorrect proc
else
_AspectCorrect proc far
; parmD pYPlaneIn ;ptr to Y input plane
; parmD pVPlaneIn ;ptr to V input plane
; parmD pUPlaneIn ;ptr to U input plane
; parmD YRes ;Y plane height
; parmD XRes ;Y plane width
; parmD pYNewHeight ;Pitch of Y plane input
; parmD YVU9Flag ;Flag=1 if YUV9
; parmD pYPlaneOut ;ptr to Y output plane
; parmD pVPlaneOut ;ptr to V output plane
; parmD YPitchOut ;Pitch of Y plane output
; parmD ShapingFlag ;Flag=1 if Shaping
endif
;set up equates
pYPlaneIn EQU DWORD PTR[ebp+8]
pVPlaneIn EQU DWORD PTR[ebp+12]
pUPlaneIn EQU DWORD PTR[ebp+16]
YRes EQU DWORD PTR[ebp+20]
XRes EQU DWORD PTR[ebp+24]
pYNewHeight EQU DWORD PTR[ebp+28]
YVU9Flag EQU DWORD PTR[ebp+32]
pYPlaneOut EQU DWORD PTR[ebp+36]
pVPlaneOut EQU DWORD PTR[ebp+40]
YPitchOut EQU DWORD PTR[ebp+44]
ShapingFlag EQU DWORD PTR[ebp+48]
;; stack usage
; previous ebp at ebp
; previous edi at ebp - 4
; previous esi at ebp - 8
; lXRes at ebp -12
; lYRes at ebp -16
; lYPitchOut at ebp -20
; YDiff at ebp -24
; outloopcnt at ebp -28
; uvWidth at ebp -32
; inloopcnt at ebp -36
; luvcounter at ebp -40
; uvoutloopcnt at ebp -44
; VDiff at ebp -48
; VInDiff at ebp -52
lXRes EQU DWORD PTR[ebp-12]
lYRes EQU DWORD PTR[ebp-16]
lYPitchOut EQU DWORD PTR[ebp-20]
YDiff EQU DWORD PTR[ebp-24]
outloopcnt EQU DWORD PTR[ebp-28]
uvWidth EQU DWORD PTR[ebp-32]
inloopcnt EQU DWORD PTR[ebp-36]
luvcounter EQU DWORD PTR[ebp-40]
uvoutloopcnt EQU DWORD PTR[ebp-44]
VDiff EQU DWORD PTR[ebp-48]
VInDiff EQU DWORD PTR[ebp-52]
xor ax,ax ; These two instructions give definitive proof we are
mov eax,0CCCCCCCCH ; in a 32-bit code segment. INT 3 occurs if not.
;get params
push ebp
ifdef WIN32
mov ebp, esp
else
movzx ebp, sp ;ebp now pointing to last pushed reg
endif
push edi
push esi
; zero out registers
xor edx, edx
xor esi, esi
xor edi, edi
; move stack variables to local space
mov eax, XRes
push eax ; store lXRes on stack
mov ebx, YRes
push ebx ; store lYRes on stack
mov ecx, YPitchOut
push ecx ; store lYpitchOut on stack
sub ecx, eax ; YDiff = YPitchOut - XRes
push ecx ; store YDiff on stack
; push stack with 0 6 additional times to make room for other locals
push edx ; outloopcnt
push edx ; uvWidth
push edx ; inloopcnt
push edx ; luvcounter
push edx ; uvoutloopcnt
push edx ; VDiff
push edx ; VInDiff
; test if YUV9 mode
mov edx, YVU9Flag
test edx,edx
jz YVU12; ; If the flag is false it must be YVU12
;**********************************************************************
;**********************************************************************
; know input was YVU9, Y Plane was processed in cc12to7.asm
mov esi, pYNewHeight
mov WORD PTR [esi], bx ; store YRes into address pYNewHeight
; ********************
; Copy V and U Plane from source to destination converting to 7 bit
; ********************
; Description of V & U Plane processing:
; - Double nested loop with
; Outlp1 executed YRes/4 lines
; Collp1 loops for number of columns
; - Read 1 U
; - Read 1 V
; - Convert each value from 8-bit to 7-bit
; - Store 1 U
; - Store 1 V
;
; Register usage
; eax U plane input address
; ebx source value and index into gTAB_UVtbl8to7
; ecx source value and index into gTAB_UVtbl8to7
; edx inner most loop counter
; esi V plane src address
; edi des address
; ebp stack pointer stuff
;
; if (16-bit)
; es input plane segment
; fs output plane segment
; ds table segment
; endif
;
; local variables
; outloopcnt
; lXRes
; lYRes
; uvWidth
; VDiff
;
; know input was YVU9
mov ecx, lYRes
mov ebx, lXRes
shr ebx, 2 ; uvWidth=XRes/4
mov eax, VPITCH ; get Fixed offset
shr ecx, 2 ; outloopcnt=YRes/4
mov uvWidth,ebx ; uvWidth=XRes/4
sub eax, ebx ; VPITCH - uvWidth
mov esi, pVPlaneIn ; Initialize input cursor
mov edi, pVPlaneOut ; Initialize output cursor
mov VDiff, eax ; store V difference
mov eax, pUPlaneIn ; Initialize input cursor
Row9lp2:
mov outloopcnt,ecx ; store updated outer loop count
mov edx, uvWidth ; init dx
xor ebx, ebx
xor ecx, ecx
Col9lpv1:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
inc eax ; pUtemp+=1
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
inc esi ; Inc source by 1,pVtemp+=1
mov BYTE PTR [edi+167],cl ; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Col9lpv1
;; increment to beginning of next line
mov edx, VDiff
mov ecx, outloopcnt ; get outer loop count
add edi,edx ; Point to next output row
dec ecx
jnz Row9lp2 ; if more to do loop
jmp Cleanup
;*****************************************************************
;*****************************************************************
; know input was YVU12
;
; if (!ShapingFlag) {
; goto YVU12_NO_SHAPING;
; } else {
; switch (YRes) { // YRes = YRes * 11 / 12;
; case 96: *pyNewHeight = 88; break;
; case 144: *pyNewHeight = 132; break;
; case 288: *pyNewHeight = 264; break;
; default: error;
; }
; }
;
YVU12:
mov eax, ShapingFlag
test eax, eax
jz YVU12_NO_SHAPING
cmp lYRes, 96 ; If 96
je YRes96
cmp lYRes, 144 ; If 144
je YRes144
cmp lYRes, 288 ; If 288
je YRes288
jmp Error
;
YRes96:
mov ax, 88 ; pyNewHeight = ax = 132
mov ecx, 7 ; for YRes lines loopcounter=11
mov uvoutloopcnt, 1 ; process 1 full set of 13&11 lines
jmp Rejoin2
YRes144:
mov ax, 132 ; pyNewHeight = ax = 132
mov ecx, 11 ; for YRes lines loopcounter=11
mov uvoutloopcnt, 2 ; process 2 full sets of 13&11 lines
jmp Rejoin2
YRes288:
mov ax, 264 ; pyNewHeight = ax = 264
mov ecx, 23 ; for YRes lines loopcounter=23
mov uvoutloopcnt, 5 ; process 5 full sets of 13&11 lines
Rejoin2:
mov esi, pYNewHeight
mov [esi], ax ; store adjusted height into
; address pYNewHeight
; ********************
; Copy Y Plane from soure to dest skipping every 12th line
; ********************
; Description of YPlane processing:
;
; Triple nested loop with
; Outlp1 executed 11 or 23 times based on 144 or 288 lines respectively
; Rowlp1 is executed 11 times
; Collp1 loops for number of columns
;
; Register usage
; eax rows loop count
; ebx input and output
; ecx outer loop count
; edx column loop counter
; esi src address
; edi des address
; ebp stack pointer stuff
;
; es input plane segment
; fs output plane segment
; ds table segment
;
; local variables
; lXRes
; YDiff
; lYPitchOut
;
mov esi, pYPlaneIn ; Initialize input cursor
mov edi, pYPlaneOut ; Initialize output cursor
; No need to re-copy first 11 lines
mov eax, lYPitchOut
mov edx, YDiff
add edi, eax ; des + 1*lYPitchOut
shl eax, 1 ; lYPitchOut*2
;;; add esi, edx ; Adjust for difference in YPitchOut
; and XRes
add edi, eax ; des + 3*lYpitchOut
shl eax, 1 ; lYPirchOut*4
;;; add edi, edx ; Adjust for difference in YPitchOut
; and XRes
add esi, eax ; source + 4*lYpitchOut
shl eax, 1 ; lYPitchOut*8
add esi, eax ; source +12*lYpitchOut
add edi, eax ; des + 11*lYPitchOut
Outlp1:
mov eax, 11 ; Initialize rows loop cnter
mov edx, lXRes ; edx = number of columns
Rowlp1:
Collp1:
mov ebx, [esi+edx-4] ; Fetch source, 4 at a time
sub edx,4 ; decrement loop counter
mov [edi+edx],ebx ; Store 4 converted values
jnz Collp1 ; if not done loop
mov edx, lYPitchOut
mov ebx, YDiff
add edi, edx ; Increment to where just processed
add esi, edx
;;; add edi, ebx ; Adjust for difference in YPitchOut
;;; add esi, ebx ; and XRes
dec eax ; decrement rows loop counter
jg Rowlp1
mov eax,lYPitchOut ; Skip 12th line
add esi,eax ; Point to next input row
dec ecx ; decrement outer loop counter
jg Outlp1 ; if more to do loop
; ************************************************************
; Copy V and U Plane from source to destination converting to 7 bit
; skipping every other line and sometimes two moving only ever other
; pixel in a row.
; ********************
;
; Description of V & U Plane processing:
; - Double nested loop with
; Outlp1 executed YRes/4 lines
; Collp1 loops for number of columns
; - Read 1 U
; - Read 1 V
; - Convert each value from 8-bit to 7-bit
; - Store 1 U
; - Store 1 V
;
; Register usage
; eax U plane input address
; ebx source value and index into gTAB_UVtbl8to7
; ecx source value and index into gTAB_UVtbl8to7
; edx counter
; esi V plane src address
; edi des address, V Plane and U Plane
; ebp stack pointer stuff
;
; es input plane segment
; fs output plane segment
; ds table segment
;
; local variables
; luvcounter
; uvoutloopcnt
; inloopcnt
; lXRes
; uvWidth
; VDiff
;
mov ebx, lXRes
mov eax, VPITCH ; get Fixed offset
shr ebx, 1 ; uvWidth=XRes/2
mov uvWidth, ebx ; uvWidth=XRes/2
shr ebx, 1
sub eax, ebx ; VPITCH - uvWidth
mov VDiff, eax ; store V difference
mov luvcounter, ebx ; luvcounter = XRes/4
mov ecx, YPITCH ; Distance to the next V
add ecx, ecx
sub ecx, uvWidth
mov VInDiff, ecx ; = YPITCH + YPITCH - uvWidth
mov esi, pVPlaneIn ; Initialize input cursor
mov edi, pVPlaneOut ; Initialize output cursor
mov eax, pUPlaneIn ; Initialize input cursor
; Process 6 first lines special
mov ebx, 3 ; initialize inner loop count
Rowlp2_6:
mov edx, luvcounter ; init dx
mov inloopcnt, ebx ; store updated inloopcnt
xor ebx, ebx
xor ecx, ecx
Collpv1:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
add eax,2 ; pUtemp+=2
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
add esi,2 ; Inc source by 2,pVtemp+=2
mov BYTE PTR [edi+167],cl; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Collpv1
; increment to beginning of next line then skip next input line
add edi,VDiff ; Point to next output row
mov edx,VInDiff ; Skip to next input row
add esi,edx ;
add eax,edx ;
; test if have processed 6 lines yet
mov ebx, inloopcnt
dec ebx
jg Rowlp2_6 ; if more to do loop
; Skipping extra line
mov edx,YPITCH ; Need same sized for add
mov ecx, uvoutloopcnt
add esi,edx ; Point to next input row
add eax,edx ; Point to next input row
; Process groups of 13 and 11 lines
Outlp2:
; Process 13 lines
mov ebx, 6 ; initialize inner loop count
mov uvoutloopcnt, ecx
Rowlp2_13:
mov edx, luvcounter ; init dx
mov inloopcnt, ebx ; store updated inloopcnt
xor ebx, ebx
xor ecx, ecx
Collpv1_13:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
add eax,2 ; pUtemp+=2
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
add esi,2 ; Inc source by 2,pVtemp+=2
mov BYTE PTR [edi+167],cl; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Collpv1_13
; increment to beginning of next line then skip next input line
add edi,VDiff ; Point to next output row
mov edx,VInDiff ; Skip to next input row
add esi,edx ;
add eax,edx ;
; test if have processed 13 lines yet
mov ebx, inloopcnt
dec ebx
jg Rowlp2_13 ; if more to do loop
; Skipping extra line
mov edx,YPITCH ; Need same sized for add
mov ebx, 5 ; initialize inner loop count
add esi,edx ; Point to next input row
add eax,edx ; Point to next input row
; Process 11 lines
Rowlp2_11:
mov edx, luvcounter ; init dx
mov inloopcnt, ebx ; store updated inloopcnt
xor ebx, ebx
xor ecx, ecx
Collpv1_11:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
add eax,2 ; pUtemp+=2
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
add esi,2 ; Inc source by 2,pVtemp+=2
mov BYTE PTR [edi+167],cl; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Collpv1_11
; increment to beginning of next line, then skip next input line
add edi, VDiff ; Point to next output row
mov edx,VInDiff ; Skip to next input row
add esi,edx ;
add eax,edx ;
; test if have processed 11 lines yet
mov ebx, inloopcnt
dec ebx
jg Rowlp2_11 ; if more to do loop
; Skipping extra line
mov edx,YPITCH ; Need same sized for add
mov ecx, uvoutloopcnt
add esi,edx ; Point to next input row
add eax,edx ; Point to next input row
dec ecx
jnz Outlp2 ; if more to do loop
;
; Process last set of 13
;
mov ebx, 6 ; initialize inner loop count
Rowlp2_13l:
mov edx, luvcounter ; init dx
mov inloopcnt, ebx ; store updated inloopcnt
xor ebx, ebx
xor ecx, ecx
Collpv1_13l:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
add eax,2 ; pUtemp+=2
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
add esi,2 ; Inc source by 2,pVtemp+=2
mov BYTE PTR [edi+167],cl; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Collpv1_13l
; increment to beginning of next line then skip next input line
add edi,VDiff ; Point to next output row
mov edx,VInDiff ; Skip to next input row
add esi,edx ;
add eax,edx ;
; test if have processed 13 lines yet
mov ebx, inloopcnt
dec ebx
jg Rowlp2_13l ; if more to do loop
; Skipping extra line
mov edx,YPITCH ; Need same sized for add
mov ebx, 2 ; initialize inner loop count
add esi,edx ; Point to next input row
add eax,edx ; Point to next input row
; Process final 4 lines
Rowlp2_f:
mov edx, luvcounter ; init dx
mov inloopcnt, ebx
xor ebx, ebx
xor ecx, ecx
Collpv1_f:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
add eax,2 ; pUtemp+=2
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
add esi,2 ; Inc source by 2,pVtemp+=2
mov BYTE PTR [edi+167],cl; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Collpv1_f
; increment to beginning of next line then skip next input line
add edi, VDiff ; Point to next output row
mov edx,VInDiff ; Skip to next input row
add esi,edx ;
add eax,edx ;
; test if have processed last lines yet
mov ebx, inloopcnt
dec ebx
jg Rowlp2_f ; if more to do loop
jmp Cleanup
; ************************************************************
; Copy V and U Plane from source to destination converting to 7 bit
; skipping every other line moving only ever other pixel in a row.
; ********************
;
; Description of V & U Plane processing:
; - Double nested loop with
; Outlp1 executed YRes/4 lines
; Collp1 loops for number of columns
; - Read 1 U
; - Read 1 V
; - Convert each value from 8-bit to 7-bit
; - Store 1 U
; - Store 1 V
;
; Register usage
; eax U plane input address
; ebx source value and index into gTAB_UVtbl8to7
; ecx source value and index into gTAB_UVtbl8to7
; edx counter
; esi V plane src address
; edi des address, V Plane and U Plane
; ebp stack pointer stuff
;
; es input plane segment
; fs output plane segment
; ds table segment
;
; local variables
; luvcounter
; inloopcnt
; lYRes
; lXRes
; uvWidth
; VDiff
; VInDiff
;
YVU12_NO_SHAPING:
cmp lYRes, 98
je YRes98_NS
cmp lYRes, 144
je YRes144_NS
cmp lYRes, 288
je YRes288_NS
jmp Error
;
YRes98_NS: ; 98 No Shaping
YRes144_NS: ; 144 No Shaping
YRes288_NS: ; 288 No Shaping
mov eax, lYRes ; pyNewHeight = ax = YRes
mov esi, pYNewHeight
mov [esi], ax ; store adjusted height into
shr eax, 2 ; inloopcnt=YRes/2
mov ebx, lXRes
shr ebx, 1 ; uvWidth=XRes/2
mov inloopcnt, eax ; initialize inner loop count
mov uvWidth, ebx ; uvWidth=XRes/2
mov ecx, VPITCH ; get output plane V pitch
shr ebx, 1
sub ecx, ebx ; VPITCH - uvWidth/2
mov luvcounter, ebx ; luvcounter = XRes/4
mov VDiff, ecx ; Store VDiff
mov ecx, YPITCH ; Distance to the next V
add ecx, ecx
sub ecx, uvWidth
mov VInDiff, ecx ; = YPITCH + YPITCH - uvWidth
mov esi, pVPlaneIn ; Initialize input cursor
mov edi, pVPlaneOut ; Initialize output cursor
mov eax, pUPlaneIn ; Initialize input cursor
mov ecx, inloopcnt
; Process all lines skipping just every other
Rowlp2_NS:
mov inloopcnt, ecx ; store update inloopcnt
xor ebx, ebx
mov edx, luvcounter ; init dx
xor ecx, ecx
Collpv1_NS:
mov cl, BYTE PTR [eax] ; Fetch *PUtemp_IN
inc edi ; Inc des by 1, PVtemp_OUT++
mov bl, BYTE PTR [esi] ; Fetch *pVtemp_IN
add eax,2 ; pUtemp+=2
mov cl, gTAB_UVtbl8to7[ecx] ; cl = gTAB_UVtbl8to7[*pUtemp_IN]
add esi,2 ; Inc source by 2,pVtemp+=2
mov BYTE PTR [edi+167],cl; store in PUtemp_OUT
mov bl, gTAB_UVtbl8to7[ebx] ; bl = gTAB_UVtbl8to7[*pVtemp_IN]
mov BYTE PTR [edi-1],bl ; store in PVtemp_OUT
xor ecx, ecx ; dummy op
dec edx
jg Collpv1_NS
; increment to beginning of next line then skip next input line
add edi, VDiff ; Point to next output row
mov edx,VInDiff ; Skip to next input row
add esi,edx ;
add eax,edx ;
mov ecx, inloopcnt ; get inloopcnt
; test if have processed all lines yet
dec ecx ; Process next line
jne Rowlp2_NS ; if more to do loop
Error:
Cleanup:
; clean out local variables on stack
pop ecx
pop ebx
pop ecx
pop ebx
pop ecx
pop ebx
pop ecx
pop ebx
pop ecx
pop ebx
pop ecx
;clear special seg registers, restore stack, pop saved registers
ifndef WIN32
xor ecx, ecx
xor ebx, ebx
mov es, cx
mov fs, bx
endif
pop esi
pop edi
pop ebp
ifdef WIN32
ret
else
db 066h
retf
endif
_AspectCorrect endp
END