BitmapCopyInfo
--------------
0x0 4 void* sourceImageBuffer
0x4 4 void* destImageBuffer
0x8 4 void* overlayMask [blight or day and night]
0xC 4 int overlayMaskBitOffset
0x10 4 int width
0x14 4 int height
0x18 4 int sourcePitch
0x1C 4 int destPitch
0x20 4 enum DrawMethod drawMethod
0x24 4 union
0x24 4 short[256]* darkPal16 [current light level]
0x24 4 int bitXOffset [For 1 bpp images]
0x28 4 int blightOverlay [0..15]
0x2C 4 short[256]* lightPal16 [full daylight]
---------------
void __cdecl DrawSprite(BitmapCopyInfo* bitmapCopyInfo);
00586CEF > >PUSH EBP ; Function: DrawSprite(BitmapCopyInfo* bitmapCopyInfo)
00586CF0 >MOV EBP,ESP
00586CF2 >PUSHAD
00586CF3 >MOV EBP,DWORD PTR SS:[EBP+8] ; EBP := [param1] BitmapCopyInfo* bitmapCopyInfo
00586CF6 >MOV ECX,DWORD PTR SS:[EBP+20] ; ECX := BitmapCopyInfo.drawMethod
00586CF9 >SHL ECX,2 ; [ECX := drawMethod * 4]
00586CFC >MOV EDI,DWORD PTR DS:[ECX+586CDF]
00586D02 >SUB EDI,Outpost2.00586D3C ; [* Calculate offset from end of CALL instruction *]
00586D08 >MOV DWORD PTR DS:[586D38],EDI ; [* Hardcode CALL address into instruction *]
00586D0E >MOV EAX,DWORD PTR SS:[EBP+18] ; EAX := BitmapCopyInfo.sourcePitch
00586D11 >MOV EBX,DWORD PTR SS:[EBP+10] ; EBX := BitmapCopyInfo.sourceWidth
00586D14 >MOV EDX,EBX
00586D16 >MOV ESI,DWORD PTR SS:[EBP+1C] ; ESI := BitmapCopyInfo.destPitch
00586D19 >SHL EDX,1
00586D1B >SUB ESI,EDX
00586D1D >SUB EAX,EBX ; EAX := sourcePitch - sourceWidth
00586D1F >MOV DWORD PTR DS:[<int destPitchDelta>],ESI ; [global] int destPitchDelta := ESI
00586D25 >MOV DWORD PTR DS:[<int sourcePitchDelta>],EAX ; [global] int sourcePitchDelta := EAX
00586D2A >MOV ESI,DWORD PTR SS:[EBP] ; ESI := BitmapCopyInfo.sourceImageBuffer*
00586D2D >MOV EDI,DWORD PTR SS:[EBP+4] ; EDI := BitmapCopyInfo.destImageBuffer*
00586D30 >MOV ECX,DWORD PTR SS:[EBP+10] ; [LoopStart]: ECX := BitmapCopyInfo.sourceWidth
00586D33 >PUSH EBP ; [Save EBP]
00586D34 >MOV EBP,DWORD PTR SS:[EBP+24] ; EBP := BitmapCopyInfo.darkPal16*
00586D37 >CALL 128CC3B4
00586D3C >POP EBP ; [Restore EBP]
00586D3D >ADD ESI,DWORD PTR DS:[<int sourcePitchDelta>] ; ESI := sourceImageBuffer* + sourcePitchDelta
00586D43 >ADD EDI,DWORD PTR DS:[<int destPitchDelta>] ; EDI := destImageBuffer* + destPitchDelta
00586D49 >DEC DWORD PTR SS:[EBP+14] ; BitmapCopyInfo.sourceHeight--
00586D4C ^ >JNZ SHORT Outpost2.00586D30 ; -> LoopStart
00586D4E >POPAD
00586D4F >LEAVE
00586D50 >RETN
00586D51 > >MOV EDX,EBP ; Function: DrawScanline8Pal16Transparent0
00586D53 >SHR ECX,1
00586D55 >JNB SHORT Outpost2.00586D6D
00586D57 >MOVZX EAX,BYTE PTR DS:[ESI] ; EAX := *sourceImageBuffer
00586D5A >ADD EAX,EAX ; [EAX := sourcePixel * 2]
00586D5C >JE SHORT Outpost2.00586D65
00586D5E >MOV AX,WORD PTR DS:[EAX+EDX] ; AX := pal16[sourcePixel * 2]
00586D62 >MOV WORD PTR DS:[EDI],AX ; *destImageBuffer := AX
00586D65 >INC ESI ; ESI := sourceImageBuffer*++
00586D66 >ADD EDI,2 ; EDI := destImageBuffer* += 2
00586D69 >OR ECX,ECX
00586D6B >JE SHORT Outpost2.00586D96 ; -> Return
00586D6D >XOR EBX,EBX ; [LoopStart]:
00586D6F >XOR EAX,EAX
00586D71 >MOV BL,BYTE PTR DS:[ESI+1] ; BL := *(sourceImageBuffer + 1)
00586D74 >MOV AL,BYTE PTR DS:[ESI] ; AL := *sourceImageBuffer
00586D76 >ADD EBX,EBX ; [EBX := sourcePixel2 * 2]
00586D78 >JE SHORT Outpost2.00586D97
00586D7A >ADD EAX,EAX ; [EAX := sourcePixel1 * 2]
00586D7C >JE SHORT Outpost2.00586DAC
00586D7E >MOV BX,WORD PTR DS:[EBX+EDX] ; [DrawBothPixels]: BX := pal16[sourcePixel2 * 2]
00586D82 >ADD ESI,2 ; ESI := sourceImageBuffer* += 2
00586D85 >MOV AX,WORD PTR DS:[EAX+EDX] ; AX := pal16[sourcePixel1 * 2]
00586D89 >SHL EBX,10 ; EBX := destPixel2 << 16
00586D8C >OR EAX,EBX ; EAX := destPixel1 | (destPixel2 << 16)
00586D8E >MOV DWORD PTR DS:[EDI],EAX ; *destImageBuffer := EAX
00586D90 >ADD EDI,4 ; EDI := destImageBuffer* += 4
00586D93 >DEC ECX
00586D94 ^ >JNZ SHORT Outpost2.00586D6D ; -> LoopStart
00586D96 >RETN
00586D97 >ADD EAX,EAX ; [EAX := sourcePixel1 * 2]
00586D99 >JE SHORT Outpost2.00586DA2 ; -> Skip drawing pixels
00586D9B >MOV BX,WORD PTR DS:[EAX+EDX] ; [DrawFirstPixelOnly]:
00586D9F >MOV WORD PTR DS:[EDI],BX ; *destImageBuffer := BX
00586DA2 >ADD ESI,2 ; [LoopEpilog]: ESI := sourceImageBuffer* += 2
00586DA5 >ADD EDI,4 ; EDI := destImageBuffer* += 4
00586DA8 >DEC ECX
00586DA9 ^ >JNZ SHORT Outpost2.00586D6D ; -> LoopStart
00586DAB >RETN
00586DAC >MOV AX,WORD PTR DS:[EBX+EDX] ; [DrawSecondPixelOnly]: AX := pal16[sourcePixel2 * 2]
00586DB0 >ADD ESI,2 ; ESI := sourceImageBuffer* += 2
00586DB3 >MOV WORD PTR DS:[EDI+2],AX ; *(destImageBuffer + 2) := AX
00586DB7 >ADD EDI,4 ; EDI := destImageBuffer* += 4
00586DBA >DEC ECX
00586DBB ^ >JNZ SHORT Outpost2.00586D6D ; -> LoopStart
00586DBD >RETN
// About 14% faster
__asm
{
sub esp, 0x8
push ebx
push esi
push edi
push ebp
; Make sure we have something to draw
mov edx, [ecx + 0x14]; height
mov ebx, [ecx + 0x10]; width
or edx, edx
jz Return
or ebx, ebx
jz Return
; Precalculate
lea esi, [ebx * 2] ; width*2
mov eax, [ecx + 0x18]; sourcePitch
mov edi, [ecx + 0x1C]; destPitch
sub eax, ebx ; sourcePitch - width
sub edi, esi ; destPitch - width*2
mov [esp + 0x10], eax; sourcePitchDelta
mov [esp + 0x14], edi; destPitchDelta
; Cache values in registers
mov esi, [ecx] ; sourceImage*
mov edi, [ecx + 0x4]; destImage*
mov ebp, [ecx + 0x24]; palette16*
mov ecx, ebx ; width
DrawPixelLoopStart:
mov al, [esi]
inc esi
;lodsb
or al, al
jz SkipPixelDraw
movzx eax, al
mov ax, [ebp + eax*2]
;stosw
mov [edi], ax
SkipPixelDraw:
add edi, 2
dec ecx
jnz DrawPixelLoopStart
mov ecx, ebx ; width
add esi, [esp + 0x10]; sourcePitchDelta
add edi, [esp + 0x14]; destPitchDelta
dec edx ; heightRemaining
jnz DrawPixelLoopStart
Return:
pop ebp
pop edi
pop esi
pop ebx
add esp, 0x8
}
// About 5% faster
__asm
{
sub esp, 0xC
; push ebx
push esi
push edi
push ebp
; Make sure we have something to draw
mov edx, [ecx + 0x14]; height
mov ebx, [ecx + 0x10]; width
or edx, edx
jz Return
or ebx, ebx
jz Return
; Precalculate
mov [esp + 0x14], edx; height
lea esi, [ebx * 2]
mov eax, [ecx + 0x18]; sourcePitch
mov edx, [ecx + 0x1C]; destPitch
sub eax, ebx
sub edx, esi
mov [esp + 0xC], eax; sourcePitchDelta
mov [esp + 0x10], edx; destPitchDelta
; Cache values in registers
mov esi, [ecx] ; sourceImage*
mov edi, [ecx + 0x4]; destImage*
mov ebp, [ecx + 0x24]; palette16*
mov ecx, ebx ; width
xor eax, eax
DrawLine:
shr ecx, 1
jnc DrawPixelPair; ->
; Handle single pixel draw
lodsb
or al, al
jz SkipOddPixelDraw; ->
mov ax, [ebp + eax*2]
mov [edi], ax
SkipOddPixelDraw:
add edi, 2
; Make sure there are still pixel pairs left to draw
or ecx, ecx
jz DrawLineLoopEpilog; ->
DrawPixelPair:
lodsw
or ax, ax
jz NextOutputPosition; ->
or al, al
jz DrawPixel2 ; ->
or ah, ah
jz DrawPixel1 ; ->
; DrawBothPixels
movzx edx, ah
xor ah, ah
mov dx, [ebp + edx*2]; Palette lookup
mov ax, [ebp + eax*2]; Palette lookup
shl edx, 16
or eax, edx
stosd
xor eax, eax
dec ecx
jnz DrawPixelPair ; ->
jmp DrawLineLoopEpilog; ->
DrawPixel1:
; Draw first pixel
mov ax, [ebp + eax*2]; Palette lookup
mov [edi], ax ; Draw pixel
jmp NextOutputPosition; ->
DrawPixel2:
or ah, ah
jz NextOutputPosition; ->
movzx edx, ah
mov ax, [ebp + edx*2]; Palette lookup
mov [edi + 2], ax ; Draw pixel
NextOutputPosition:
add edi, 4
DrawPixelsLoopEpilog:
dec ecx
jnz DrawPixelPair ; ->
DrawLineLoopEpilog:
dec [esp + 0x14] ; height
jz Return
mov ecx, ebx ; width
add esi, [esp + 0xC]; sourcePitchDelta
add edi, [esp + 0x10]; destPitchDelta
jmp DrawLine
Return:
pop ebp
pop edi
pop esi
; pop ebx
add esp, 0xC
}
// About 10% faster
__asm
{
sub esp, 0x18
push ebx
push esi
push edi
push ebp
; Make sure we have something to draw
mov edx, [ecx + 0x14]; height
mov ebx, [ecx + 0x10]; width
or edx, edx
jz Return
or ebx, ebx
jz Return
; Precalculate
mov [esp + 0x18], edx; heightRemaining
lea esi, [ebx * 2]
mov eax, [ecx + 0x18]; sourcePitch
mov edx, [ecx + 0x1C]; destPitch
sub eax, ebx
sub edx, esi
mov [esp + 0x10], eax; sourcePitchDelta
mov [esp + 0x14], edx; destPitchDelta
; Cache values in registers
mov esi, [ecx] ; sourceImage*
mov edi, [ecx + 0x4]; destImage*
mov ebp, [ecx + 0x24]; palette16*
; Calculate number of leading pixels
mov ecx, esi
neg ecx
and ecx, 3 ; Number of pixels until an aligned boundary [0..3]
cmp ecx, ebx ; Check number of lead pixels against width
jbe SkipLeadPixelCap; ->
mov ecx, ebx ; Number of lead pixels is capped at width
SkipLeadPixelCap:
mov [esp + 0x1C], ecx; numLeadPixels
; Calculate number of tail pixels and middle DWORDs
sub ebx, ecx ; width - numLeadPixels
mov edx, ebx
and ebx, 3 ; numTailPixels
shr edx, 2 ; numMiddleDwords
mov [esp + 0x24], ebx; numTailPixels
mov [esp + 0x20], edx; numMiddleDwords
; Combine lead and tail pixels when numMiddleDwords is 0
jnz SkipCombineLeadAndTail
add ecx, edx
mov [esp + 0x1C], ecx; numLeadPixels
mov [esp + 0x24], 0 ; numTailPixels
SkipCombineLeadAndTail:
xor eax, eax
DrawLine:
; Get number of leading pixels
mov ecx, [esp + 0x1C]; numLeadPixels
or ecx, ecx
jz DrawAlignedPixels
DrawLeadPixelLoop:
; Draw single pixels up to an aligned boundary
lodsb
xor ah, ah
or al, al
jz SkipLeadPixelDraw
mov ax, [ebp + eax*2]; Palette lookup
;stosw ; Write pixel
mov [edi], ax
SkipLeadPixelDraw:
add edi, 2
dec ecx
jnz DrawLeadPixelLoop
DrawAlignedPixels:
; Get number of aligned pixels
mov ecx, [esp + 0x20]; numMiddleDwords
or ecx, ecx
jz DrawLineLoopEpilog
DrawPixelDword:
lodsd
; Check transparent pixel block
or eax, eax
jz SkipOverTransparentBlock
;or ax, ax
;jz DrawSecondPixelWord
; Draw first pixel word
or al, al
jz DrawFirstBlockSecondPixel
or ah, ah
jz DrawFirstBlockFirstPixel
; Draw both pixels in first block
movzx edx, ah
movzx ebx, al
mov dx, [ebp + edx*2]; Palette lookup
mov ax, [ebp + ebx*2]; Palette lookup
shl edx, 16
mov dx, ax
mov [edi], edx ; Write pixels
DrawSecondPixelWord:
add edi, 4
shr eax, 16
;or ax, ax
;jz DrawPixelDwordLoopEpilog
or al, al
jz DrawSecondBlockSecondPixel
or ah, ah
jz DrawSecondBlockFirstPixel
; Draw both pixels in second block
movzx edx, ah
movzx ebx, al
mov dx, [ebp + edx*2]; Palette lookup
mov ax, [ebp + ebx*2]; Palette lookup
shl edx, 16
or eax, edx
stosd
DrawPixelDwordLoopEpilog:
dec ecx
jnz DrawPixelDword ; ->
jmp DrawTailPixels ; ->
DrawFirstBlockSecondPixel:
or ah, ah
jz DrawSecondPixelWord
movzx edx, ah
mov ax, [ebp + edx*2]; Palette lookup
mov [edi + 2], ax
jmp DrawSecondPixelWord
DrawFirstBlockFirstPixel:
movzx ebx, al
mov ax, [ebp + ebx*2]; Palette lookup
mov [edi], ax
jmp DrawSecondPixelWord
DrawSecondBlockSecondPixel:
or ah, ah
jz SkipDrawSecondBlockSecondPixel
movzx edx, ah
mov ax, [ebp + edx*2]; Palette lookup
mov [edi + 2], ax
SkipDrawSecondBlockSecondPixel:
add edi, 4
jmp DrawPixelDwordLoopEpilog
DrawSecondBlockFirstPixel:
mov ax, [ebp + eax*2]; Palette lookup
mov [edi], ax
add edi, 4
jmp DrawPixelDwordLoopEpilog
SkipOverTransparentBlock:
add edi, 8
jmp DrawPixelDwordLoopEpilog
DrawTailPixels:
; Get number of tail pixels
mov ecx, [esp + 0x24]; numTailPixels
xor eax, eax
or ecx, ecx
jz DrawLineLoopEpilog
DrawTailPixelLoop:
; Draw single pixels until end of line
lodsb
xor ah, ah
or al, al
jz SkipTailPixelDraw
mov ax, [ebp + eax*2]; Palette lookup
;stosw ; Write pixel
mov [edi], ax
SkipTailPixelDraw:
add edi, 2
dec ecx
jnz DrawTailPixelLoop
DrawLineLoopEpilog:
; Increment pointers
add esi, [esp + 0x10]; sourcePitchDelta
add edi, [esp + 0x14]; destPitchDelta
; Decrement loop count
dec [esp + 0x18] ; heightRemaining
jnz DrawLine
Return:
pop ebp
pop edi
pop esi
pop ebx
add esp, 0x18
}
Not likely. At least not in it's current form. There is too little gain to justify it.Yeah, that's what I thought. I mean, how many people would this actually effect? I'd be surprised if anyone here was still playing OP2 on a Windows 95.
I suppose most people have faster computersWhen I made the Windows 95 comment, I was referring to how this change would only affect people with older, slower computers available when OP2 first came out in '97. I'd imagine most people no longer use those kinds of computers (assuming "computer rot" wouldn't have made them totally inoperable by now).