;THE COMPUTER CODE CONTAINED HEREIN IS THE SOLE PROPERTY OF PARALLAX ;SOFTWARE CORPORATION ("PARALLAX"). PARALLAX, IN DISTRIBUTING THE CODE TO ;END-USERS, AND SUBJECT TO ALL OF THE TERMS AND CONDITIONS HEREIN, GRANTS A ;ROYALTY-FREE, PERPETUAL LICENSE TO SUCH END-USERS FOR USE BY SUCH END-USERS ;IN USING, DISPLAYING, AND CREATING DERIVATIVE WORKS THEREOF, SO LONG AS ;SUCH USE, DISPLAY OR CREATION IS FOR NON-COMMERCIAL, ROYALTY OR REVENUE ;FREE PURPOSES. IN NO EVENT SHALL THE END-USER USE THE COMPUTER CODE ;CONTAINED HEREIN FOR REVENUE-BEARING PURPOSES. THE END-USER UNDERSTANDS ;AND AGREES TO THE TERMS HEREIN AND ACCEPTS THE SAME BY USE OF THIS FILE. ;COPYRIGHT 1993-1998 PARALLAX SOFTWARE CORPORATION. ALL RIGHTS RESERVED. ; ; $Source: f:/miner/source/texmap/rcs/tmap_per.asm $ ; $Revision: 1.18 $ ; $Author: mike $ ; $Date: 1994/05/03 11:08:32 $ ; ; Perspective texture mapper inner loop. ; ; $Log: tmap_per.asm $ ; Revision 1.18 1994/05/03 11:08:32 mike ; Trap divide overflows. ; ; Revision 1.17 1994/04/21 15:03:41 mike ; make faster. ; ; Revision 1.16 1994/04/08 16:46:57 john ; Made 32 fade levels. Hacked. ; ; Revision 1.15 1994/03/31 08:35:18 mike ; Fix quantized-by-4 bug in inner loop. ; ; Revision 1.14 1994/03/14 17:41:14 mike ; Fix bug in unlighted version. ; ; Revision 1.13 1994/03/14 15:45:14 mike ; streamline code. ; ; Revision 1.12 1994/01/14 14:01:58 mike ; *** empty log message *** ; ; Revision 1.11 1993/12/18 14:43:44 john ; Messed around with doing 1/z, the u*(1/z) and v*(1/z) ; (Went from 23 fps to 21 fps... not good! ) ; ; Revision 1.10 1993/12/17 16:14:17 john ; Split lighted/nonlighted, so there is no cmp lighting ; in the inner loop. ; ; Revision 1.9 1993/12/17 12:34:29 john ; Made leftover bytes use linear approx instead of correct... ; should save about 8 divides per scanline on average. ; Also, took out anti-aliasing code and rearranged to ; order of some instructions to help on 486 pipelining. ; (The anti-aliasing code did *not* look good, so I ; figure there was no reason to keep it in. ) ; ; Revision 1.8 1993/12/16 18:37:52 mike ; Align some stuff on 4 byte boundaries. ; ; Revision 1.7 1993/11/30 08:44:18 john ; Made selector set check for < 64*64 bitmaps. ; ; Revision 1.6 1993/11/23 17:25:26 john ; Added safety "and eax, 0fffh" in lighting lookup. ; ; Revision 1.5 1993/11/23 15:08:52 mike ; Fixed lighting bug. ; ; Revision 1.4 1993/11/23 14:38:50 john ; optimized NORMAL code by switching EBX and ESI, so BH can be used in ; the lighting process. ; ; Revision 1.3 1993/11/23 14:30:53 john ; Made the perspective tmapper do 1/8 divides; added lighting. ; ; Revision 1.2 1993/11/22 10:24:59 mike ; *** empty log message *** ; ; Revision 1.1 1993/09/08 17:29:53 mike ; Initial revision ; ; ; .386 public _fx_u,_fx_v,_fx_z,_fx_du_dx,_fx_dv_dx,_fx_dz_dx,_fx_y,_fx_xleft,_fx_xright public _pixptr public asm_tmap_scanline_per_ include tmap_inc.asm public _max_ecx,_min_ecx extern _fx_l:dword extern _fx_dl_dx:dword extern _dither_intensity_lighting:dword extern _Lighting_on:dword extern _pixel_data_selector:word, _gr_fade_table_selector:word, _transparency_on:dword _DATA SEGMENT DWORD PUBLIC USE32 'DATA' align 4 ;**_v_window_left dd _window_left ;**_v_window_right dd _window_right ;**_v_window_top dd _window_top ;**_v_window_bottom dd _window_bottom ; ---------- These are passed in by the C caller ---------- _fx_u dd ? _fx_v dd ? _fx_z dd ? _fx_du_dx dd ? _fx_dv_dx dd ? _fx_dz_dx dd ? _fx_y dd ? _fx_xleft dd ? _fx_xright dd ? _pixptr dd ? ; ----------^^ These are passed in by the C caller ^^---------- public _x,_loop_count align 4 _x dd ? _loop_count dd ? _max_ecx dd 0 _min_ecx dd 55555555h public _per2_flag _per2_flag dd 1 public _scan_doubling_flag, _linear_if_far_flag _scan_doubling_flag dd 0 _linear_if_far_flag dd 0 ;---------- local variables align 4 req_base dd ? req_size dd ? U0 dd ? U1 dd ? V0 dd ? V1 dd ? num_left_over dd ? DU1 dd ? DV1 dd ? DZ1 dd ? ;*NO_DITHER _fx_dl_dx1 dd ? ;*NO_DITHER _fx_dl_dx2 dd ? _DATA ENDS DGROUP GROUP _DATA _TEXT SEGMENT DWORD PUBLIC USE32 'CODE' ASSUME DS:_DATA ASSUME CS:_TEXT ; -------------------------------------------------------------------------------------------------- ; Enter: ; _xleft fixed point left x coordinate ; _xright fixed point right x coordinate ; _y fixed point y coordinate ; _pixptr address of source pixel map ; _u fixed point initial u coordinate ; _v fixed point initial v coordinate ; _z fixed point initial z coordinate ; _du_dx fixed point du/dx ; _dv_dx fixed point dv/dx ; _dz_dx fixed point dz/dx ; for (x = (int) xleft; x <= (int) xright; x++) { ; _setcolor(read_pixel_from_tmap(srcb,((int) (u/z)) & 63,((int) (v/z)) & 63)); ; _setpixel(x,y); ; ; u += du_dx; ; v += dv_dx; ; z += dz_dx; ; } asm_tmap_scanline_per_: push es push fs pusha ;---------------------------- setup for loop --------------------------------- ; Setup for loop: _loop_count iterations = (int) xright - (int) xleft ; esi source pixel pointer = pixptr ; edi initial row pointer = y*320+x ; set esi = pointer to start of texture map data mov es,_pixel_data_selector ; selector[0*2] mov fs,_gr_fade_table_selector ; selector[1*2] ; fs = bmd_fade_table ; set edi = address of first pixel to modify mov edi,_fx_y cmp edi,_window_bottom jae _none_to_do imul edi,_bytes_per_row mov eax,_fx_xleft sar eax,16 jns eax_ok sub eax,eax eax_ok: add edi,eax add edi,write_buffer ; set _loop_count = # of iterations mov eax,_fx_xright sar eax,16 cmp eax,_window_right jb eax_ok1 mov eax,_window_right eax_ok1: cmp eax,_window_left ja eax_ok2 mov eax,_window_left eax_ok2: mov ebx,_fx_xleft sar ebx,16 sub eax,ebx js _none_to_do cmp eax,_window_width jbe _ok_to_do mov eax,_window_width _ok_to_do: mov _loop_count,eax ; lighting values are passed in fixed point, but need to be in 8 bit integer, 8 bit fraction so we can easily ; get the integer by reading %bh sar _fx_l, 8 sar _fx_dl_dx,8 jns dl_dx_ok inc _fx_dl_dx ; round towards 0 for negative deltas dl_dx_ok: ;*NO_DITHER ;-------------------------- setup for dithering ----------------------------- ;*NO_DITHER ; do dithering, use lighting values which are .5 less than and .5 more than actual value ;*NO_DITHER mov ebx,40h ; assume dithering on ;*NO_DITHER mov eax,_fx_dl_dx ;*NO_DITHER add eax,ebx ; add 1/2 ;*NO_DITHER mov _fx_dl_dx1,eax ;*NO_DITHER mov eax,_fx_dl_dx ;*NO_DITHER sub eax,ebx ;*NO_DITHER mov _fx_dl_dx2,eax ;*NO_DITHER mov ebx,_fx_xleft ;*NO_DITHER shr ebx,16 ;*NO_DITHER xor ebx,_fx_y ;*NO_DITHER and ebx,1 ;*NO_DITHER jne dith_1 ;*NO_DITHER xchg eax,_fx_dl_dx1 ;*NO_DITHER dith_1: mov _fx_dl_dx2,eax ; set initial values mov ebx,_fx_u mov ebp,_fx_v mov ecx,_fx_z test _per2_flag,-1 je tmap_loop cmp _Lighting_on, 0 je tmap_loop_fast_nolight jmp tmap_loop_fast ;================ PERSPECTIVE TEXTURE MAP INNER LOOPS ======================== ; ; Usage in loop: eax division, pixel value ; ebx u ; ecx z ; edx division ; ebp v ; esi source pixel pointer ; edi destination pixel pointer ;-------------------- NORMAL PERSPECTIVE TEXTURE MAP LOOP ----------------- align 4 tmap_loop: xchg ebx, esi ; compute v coordinate mov eax,ebp ; get v cdq idiv ecx ; eax = (v/z) and eax,3fh ; mask with height-1 mov ebx,eax ; compute u coordinate mov eax,esi ; get u cdq idiv ecx ; eax = (u/z) shl eax,26 shld ebx,eax,6 ; esi = v*64+u ; read 1 pixel movzx eax,byte ptr es:[ebx] ; get pixel from source bitmap cmp _Lighting_on, 0 je NoLight1 ; LIGHTING CODE mov ebx, _fx_l ; get temp copy of lighting value mov ah, bh ; get lighting level add ebx, _fx_dl_dx ; update lighting value ;*NO_DITHER add ebx, _fx_dl_dx1 ; update lighting value ;*NO_DITHER and eax, (32*256)-1 ;*NO_DITHER push eax ; dithering ;*NO_DITHER mov eax, _fx_dl_dx2 ;*NO_DITHER xchg _fx_dl_dx1, eax ;*NO_DITHER mov _fx_dl_dx2, eax ;*NO_DITHER pop eax mov al, fs:[eax] ; xlat pixel thru lighting tables mov _fx_l, ebx ; save temp copy of lighting value ; transparency check NoLight1: cmp al,255 je skip1 mov [edi],al skip1: inc edi ; update deltas add ebp,_fx_dv_dx add esi,_fx_du_dx add ecx,_fx_dz_dx je _div_0_abort ; would be dividing by 0, so abort xchg esi, ebx dec _loop_count jns tmap_loop _none_to_do: popa pop fs pop es ret ; We detected a z=0 condition, which seems pretty bogus, don't you think? ; So, we abort, but maybe we want to know about it. _div_0_abort: ;** int 3 jmp _none_to_do ;-------------------------- PER/4 TMAPPER ---------------- ; ; x = x1 ; U0 = u/w; V0 = v/w; ; while ( 1 ) ; u += du_dx*4; v+= dv_dx*4 ; U1 = u/w; V1 = v/w; ; DUDX = (U1-U0)/4; DVDX = (V1-V0)/4; ; ; ; Pixel 0 ; pixels = texmap[V0*64+U0]; ; U0 += DUDX; V0 += DVDX ; ; Pixel 1 ; pixels = (pixels<<8)+texmap[V0*64+U0]; ; U0 += DUDX; V0 += DVDX ; ; Pixel 2 ; pixels = (pixels<<8)+texmap[V0*64+U0]; ; U0 += DUDX; V0 += DVDX ; ; Pixel 3 ; pixels = (pixels<<8)+texmap[V0*64+U0]; ; ; screen[x] = pixel ; x += 4; ; U0 = U1; V0 = V1 NBITS = 3 ZSHIFT = 3 PDIV MACRO ; Returns EAX/ECX in 16.16 format in EAX. Trashes EDX ; sig bits 6.3 ;--old-- cdq ;--old-- shld edx,eax, ZSHIFT ;--old-- lea eax, [eax*8] ;--old-- idiv ecx ; eax = (v/z) ;--old-- shl eax, 16-ZSHIFT mov edx,eax shl eax,ZSHIFT sar edx,32-ZSHIFT idiv ecx ; eax = (v/z) shl eax, 16-ZSHIFT ENDM wr_onepix macro num local skip cmp cl,255 je skip mov num[edi],cl ror ecx,8 skip: endm public tmap_loop_fast ; -------------------------------------- Start of Getting Dword Aligned ---------------------------------------------- ; ebx fx_u tmap_loop_fast: mov esi,ebx align 4 NotDwordAligned1: test edi, 11b jz DwordAligned1 ; compute v coordinate mov eax,ebp ; get v cdq idiv ecx ; eax = (v/z) and eax,3fh ; mask with height-1 mov ebx,eax ; compute u coordinate mov eax,esi ; get u cdq idiv ecx ; eax = (u/z) shl eax,26 shld ebx,eax,6 ; esi = v*64+u ; read 1 pixel movzx eax,byte ptr es:[ebx] ; get pixel from source bitmap ; lighting code mov ebx, _fx_l ; get temp copy of lighting value mov ah, bh ; get lighting level add ebx, _fx_dl_dx ; update lighting value mov _fx_l, ebx ; save temp copy of lighting value ; transparency check cmp al,255 je skip2 ; this pixel is transparent, so don't write it (or light it) mov al, fs:[eax] ; xlat pixel thru lighting tables ; write 1 pixel mov [edi],al skip2: inc edi ; update deltas add ebp,_fx_dv_dx add esi,_fx_du_dx add ecx,_fx_dz_dx je _div_0_abort ; would be dividing by 0, so abort dec _loop_count jns NotDwordAligned1 jmp _none_to_do ; -------------------------------------- End of Getting Dword Aligned ---------------------------------------------- DwordAligned1: mov ebx,esi ; get fx_u mov eax, _loop_count inc eax mov num_left_over, eax shr eax, NBITS cmp eax, 0 je tmap_loop mov _loop_count, eax ; _loop_count = pixels / NPIXS shl eax, 3 sub num_left_over, eax ; num_left_over = obvious ; compute initial v coordinate mov eax,ebp ; get v mov edx,ebp shl eax,ZSHIFT sar edx,32-ZSHIFT idiv ecx ; eax = (v/z) shl eax, 16-ZSHIFT mov V0, eax ; compute initial u coordinate mov eax,ebx ; get u mov edx,ebx shl eax,ZSHIFT sar edx,32-ZSHIFT idiv ecx ; eax = (v/z) shl eax, 16-ZSHIFT mov U0, eax ; Set deltas to NPIXS pixel increments mov eax, _fx_du_dx shl eax, 3 mov DU1, eax mov eax, _fx_dv_dx shl eax, 3 mov DV1, eax mov eax, _fx_dz_dx shl eax, 3 mov DZ1, eax align 4 TopOfLoop4: add ebx, DU1 add ebp, DV1 add ecx, DZ1 je _div_0_abort ; would be dividing by 0, so abort ; Done with ebx, ebp, ecx until next iteration push ebx push ecx push ebp push edi ; Find fixed U1 mov eax, ebx mov edx,ebx shl eax,ZSHIFT sar edx,32-ZSHIFT idiv ecx ; eax = (v/z) shl eax, 16-ZSHIFT mov ebx, eax ; ebx = U1 until pop's ; Find fixed V1 mov eax, ebp mov edx, ebp shl eax,ZSHIFT sar edx,32-ZSHIFT idiv ecx ; eax = (v/z) mov ecx, U0 ; ecx = U0 until pop's mov edi, V0 ; edi = V0 until pop's shl eax, 16-ZSHIFT mov ebp, eax ; ebp = V1 until pop's ; Make ESI = V0:U0 in 6:10,6:10 format mov eax, ecx shr eax, 6 mov esi, edi shl esi, 10 mov si, ax ; Make EDX = DV:DU in 6:10,6:10 format mov eax, ebx sub eax, ecx sar eax, NBITS+6 mov edx, ebp sub edx, edi shl edx, 10-NBITS ; EDX = V1-V0/ 4 in 6:10 int:frac mov dx, ax ; put delta u in low word ; Save the U1 and V1 so we don't have to divide on the next iteration mov U0, ebx mov V0, ebp pop edi ; Restore EDI before using it ; LIGHTING CODE mov ebx, _fx_l mov ebp, _fx_dl_dx test _transparency_on,-1 je no_trans1 REPT (1 SHL (NBITS-2)) local skip3,no_trans1 REPT 2 local skipa1,skipa2 mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v add esi, edx ; inc u,v mov al, es:[eax] ; get pixel from source bitmap cmp al,255 je skipa1 mov ah, bh ; form lighting table lookup value add ebx, ebp ; update lighting value mov al, fs:[eax] ; xlat thru lighting table into dest buffer mov [edi],al skipa1: inc edi ; Do odd pixel mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v add esi, edx ; inc u,v mov al, es:[eax] ; get pixel from source bitmap cmp al,255 je skipa2 mov ah, bh ; form lighting table lookup value add ebx, ebp ; update lighting value mov al, fs:[eax] ; xlat thru lighting table into dest buffer mov [edi],al skipa2: inc edi ENDM ENDM jmp cont1 ; ------------------------------------------------------- no_trans1: REPT (1 SHL (NBITS-2)) local skip3 REPT 2 mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v add esi, edx ; inc u,v mov al, es:[eax] ; get pixel from source bitmap mov ah, bh ; form lighting table lookup value add ebx, ebp ; update lighting value mov cl, fs:[eax] ; xlat thru lighting table into dest buffer ; Do odd pixel mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v add esi, edx ; inc u,v mov al, es:[eax] ; get pixel from source bitmap mov ah, bh ; form lighting table lookup value add ebx, ebp ; update lighting value mov ch, fs:[eax] ; xlat thru lighting table into dest buffer ror ecx, 16 ; move to next double dest pixel position ENDM mov [edi],ecx ; Draw 4 pixels to display skip3: add edi,4 ENDM cont1: ; ------------------------------------------------------- ; LIGHTING CODE mov _fx_l, ebx pop ebp pop ecx pop ebx dec _loop_count jnz TopOfLoop4 EndOfLoop4: cmp num_left_over, 0 je _none_to_do ; ----------------------------------------- Start of LeftOver Pixels ------------------------------------------ DoEndPixels: add ebx, DU1 add ebp, DV1 add ecx, DZ1 je _div_0_abort push edi ; use edi as a temporary variable cmp ecx,10 jg ecx_ok mov ecx,10 ecx_ok: ; Find fixed U1 mov eax, ebx PDIV mov ebx, eax ; ebx = U1 until pop's ; Find fixed V1 mov eax, ebp PDIV mov ebp, eax ; ebp = V1 until pop's mov ecx, U0 ; ecx = U0 until pop's mov edi, V0 ; edi = V0 until pop's ; Make ESI = V0:U0 in 6:10,6:10 format mov eax, ecx shr eax, 6 mov esi, edi shl esi, 10 mov si, ax ; Make EDX = DV:DU in 6:10,6:10 format mov eax, ebx sub eax, ecx sar eax, NBITS+6 mov edx, ebp sub edx, edi shl edx, 10-NBITS ; EDX = V1-V0/ 4 in 6:10 int:frac mov dx, ax ; put delta u in low word pop edi ; Restore EDI before using it mov ecx, num_left_over ; LIGHTING CODE mov ebx, _fx_l mov ebp, _fx_dl_dx ITERATION = 0 REPT (1 SHL (NBITS-1)) local skip4, skip5 ; Do even pixel mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v mov al, es:[eax] ; get pixel from source bitmap add esi, edx ; inc u,v mov ah, bh ; form lighting table lookup value ;SAFETYand ah,0fh add ebx, ebp ; update lighting value cmp al,255 je skip4 mov al, fs:[eax] ; xlat thru lighting table into dest buffer mov [edi+ITERATION], al ; write pixel skip4: dec ecx jz _none_to_do ITERATION = ITERATION + 1 ; Do odd pixel mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v mov al, es:[eax] ; get pixel from source bitmap add esi, edx ; inc u,v mov ah, bh ; form lighting table lookup value add ebx, _fx_dl_dx ; update lighting value cmp al,255 je skip5 ;SAFETYand ah,0fh mov al, fs:[eax] ; xlat thru lighting table into dest buffer mov [edi+ITERATION], al ; write pixel skip5: dec ecx jz _none_to_do ITERATION = ITERATION + 1 ENDM ; ----------------------------------------- End of LeftOver Pixels ------------------------------------------ ; Should never get here!!!! int 3 jmp _none_to_do ; ==================================================== No Lighting Code ====================================================== public tmap_loop_fast_nolight tmap_loop_fast_nolight: mov esi,ebx align 4 NotDwordAligned1_nolight: test edi, 11b jz DwordAligned1_nolight ; compute v coordinate mov eax,ebp ; get v cdq idiv ecx ; eax = (v/z) and eax,3fh ; mask with height-1 mov ebx,eax ; compute u coordinate mov eax,esi ; get u cdq idiv ecx ; eax = (u/z) shl eax,26 shld ebx,eax,6 ; esi = v*64+u ; read 1 pixel mov al,es:[ebx] ; get pixel from source bitmap ; write 1 pixel cmp al,255 je skip6 mov [edi],al skip6: inc edi ; update deltas add ebp,_fx_dv_dx add esi,_fx_du_dx add ecx,_fx_dz_dx je _div_0_abort ; would be dividing by 0, so abort dec _loop_count jns NotDwordAligned1_nolight jmp _none_to_do DwordAligned1_nolight: mov ebx,esi mov eax, _loop_count inc eax mov num_left_over, eax shr eax, NBITS cmp eax, 0 je tmap_loop mov _loop_count, eax ; _loop_count = pixels / NPIXS shl eax, NBITS sub num_left_over, eax ; num_left_over = obvious ; compute initial v coordinate mov eax,ebp ; get v PDIV mov V0, eax ; compute initial u coordinate mov eax,ebx ; get u PDIV mov U0, eax ; Set deltas to NPIXS pixel increments mov eax, _fx_du_dx shl eax, NBITS mov DU1, eax mov eax, _fx_dv_dx shl eax, NBITS mov DV1, eax mov eax, _fx_dz_dx shl eax, NBITS mov DZ1, eax align 4 TopOfLoop4_nolight: add ebx, DU1 add ebp, DV1 add ecx, DZ1 je _div_0_abort ; Done with ebx, ebp, ecx until next iteration push ebx push ecx push ebp push edi ; Find fixed U1 mov eax, ebx PDIV mov ebx, eax ; ebx = U1 until pop's ; Find fixed V1 mov eax, ebp PDIV mov ebp, eax ; ebp = V1 until pop's mov ecx, U0 ; ecx = U0 until pop's mov edi, V0 ; edi = V0 until pop's ; Make ESI = V0:U0 in 6:10,6:10 format mov eax, ecx shr eax, 6 mov esi, edi shl esi, 10 mov si, ax ; Make EDX = DV:DU in 6:10,6:10 format mov eax, ebx sub eax, ecx sar eax, NBITS+6 mov edx, ebp sub edx, edi shl edx, 10-NBITS ; EDX = V1-V0/ 4 in 6:10 int:frac mov dx, ax ; put delta u in low word ; Save the U1 and V1 so we don't have to divide on the next iteration mov U0, ebx mov V0, ebp pop edi ; Restore EDI before using it REPT (1 SHL (NBITS-2)) local skip7, no_trans2 REPT 4 ; Do 1 pixel mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v mov cl, es:[eax] ; load into buffer register add esi, edx ; inc u,v ror ecx, 8 ; move to next dest pixel ENDM test _transparency_on,-1 je no_trans2 cmp ecx,-1 je skip7 wr_onepix 0 wr_onepix 1 wr_onepix 2 wr_onepix 3 jmp skip7 no_trans2: mov [edi],ecx ; Draw 4 pixels to display skip7: add edi,4 ENDM pop ebp pop ecx pop ebx dec _loop_count jnz TopOfLoop4_nolight EndOfLoop4_nolight: cmp num_left_over, 0 je _none_to_do DoEndPixels_nolight: add ebx, DU1 add ebp, DV1 add ecx, DZ1 je _div_0_abort push edi ; use edi as a temporary variable ; Find fixed U1 mov eax, ebx PDIV mov ebx, eax ; ebx = U1 until pop's ; Find fixed V1 mov eax, ebp PDIV mov ebp, eax ; ebp = V1 until pop's mov ecx, U0 ; ecx = U0 until pop's mov edi, V0 ; edi = V0 until pop's ; Make ESI = V0:U0 in 6:10,6:10 format mov eax, ecx shr eax, 6 mov esi, edi shl esi, 10 mov si, ax ; Make EDX = DV:DU in 6:10,6:10 format mov eax, ebx sub eax, ecx sar eax, NBITS+6 mov edx, ebp sub edx, edi shl edx, 10-NBITS ; EDX = V1-V0/ 4 in 6:10 int:frac mov dx, ax ; put delta u in low word pop edi ; Restore EDI before using it mov ecx, num_left_over ITERATION = 0 REPT (1 SHL NBITS) local skip8 ; Do 1 pixel mov eax, esi ; get u,v shr eax, 26 ; shift out all but int(v) shld ax,si,6 ; shift in u, shifting up v mov al, es:[eax] ; load into buffer register add esi, edx ; inc u,v cmp al,255 je skip8 mov [edi+ITERATION], al ; write pixel skip8: dec ecx jz _none_to_do ITERATION = ITERATION + 1 ENDM ; Should never get here!!!!! int 3 jmp _none_to_do _TEXT ends end