(mandelbrot) Improved speed
This commit is contained in:
parent
8ae1c191d7
commit
497b01fcfb
|
@ -1,4 +1,6 @@
|
||||||
( mandelbrot )
|
( mandelbrot.tal )
|
||||||
|
( )
|
||||||
|
( by alderwick and d_m )
|
||||||
|
|
||||||
%WIDTH { #02a0 }
|
%WIDTH { #02a0 }
|
||||||
%HEIGHT { #0200 }
|
%HEIGHT { #0200 }
|
||||||
|
@ -17,88 +19,106 @@
|
||||||
#0ff0 .System/g DEO2
|
#0ff0 .System/g DEO2
|
||||||
#00ff .System/b DEO2
|
#00ff .System/b DEO2
|
||||||
|
|
||||||
WIDTH .Screen/width DEO2 ( 640 )
|
( size )
|
||||||
HEIGHT .Screen/height DEO2 ( 480 )
|
WIDTH .Screen/width DEO2
|
||||||
|
HEIGHT .Screen/height DEO2
|
||||||
|
|
||||||
|
( run )
|
||||||
draw-mandel
|
draw-mandel
|
||||||
|
|
||||||
BRK
|
BRK
|
||||||
|
|
||||||
@draw-mandel ( -- )
|
( draw the mandelbrot set using 4.12 fixed point numbers )
|
||||||
|
@draw-mandel ( -> )
|
||||||
|
XMAX XMIN SUB2 WIDTH DIV2 ,&dx STR2 ( ; &dx<-{xmax-xmin}/width )
|
||||||
|
YMAX YMIN SUB2 HEIGHT DIV2 ,&dy STR2 ( ; &dy<-{ymax-ymin}/height )
|
||||||
|
[ LIT2 01 -Screen/auto ] DEO ( ; auto<-1 )
|
||||||
|
LIT2r 8000 ( [8000] )
|
||||||
|
YMAX YMIN ( ymax* ymin* [8000] )
|
||||||
|
&yloop ( ymax* y* [8000] )
|
||||||
|
XMAX XMIN ( ymax* y* xmax* xmin* [8000] )
|
||||||
|
&xloop ( ymax* y* xmax* x* [8000] )
|
||||||
|
ROT2k evaluate ( ymax* y* xmax* x* xmax* count^ [8000] )
|
||||||
|
.Screen/pixel DEO POP2 ( ymax* y* xmax* x* [8000] )
|
||||||
|
[ LIT2 &dx $2 ] ADD2 ( ymax* y* xmax* x+dx* [8000] )
|
||||||
|
OVR2 STH2kr ADD2 ( ymax* y* xmax* x+dx* 8000+xmax* [8000] )
|
||||||
|
OVR2 STH2kr ADD2 ( ymax* y* xmax* x+dx* 8000+xmax* 8000+x+dx* [8000] )
|
||||||
|
GTH2 ?&xloop ( ymax* y* xmax* x+dx* [8000] )
|
||||||
|
POP2 POP2 ( ymax* y* [8000] )
|
||||||
|
#0000 .Screen/x DEO2 ( ymax* y* [8000] ; sc/x<-0 )
|
||||||
|
.Screen/y DEI2k ( ymax* y* d^ sy* [8000] )
|
||||||
|
INC2 ROT DEO2 ( ymax* y* [8000] ; sc/y<-sy+1 )
|
||||||
|
[ LIT2 &dy $2 ] ADD2 ( ymax* y+dy* [8000] )
|
||||||
|
OVR2 STH2kr ADD2 ( ymax* y+dy* 8000+ymax* [8000] )
|
||||||
|
OVR2 STH2kr ADD2 ( ymax* y+dy* 8000+ymax* 8000+y+dy* [8000] )
|
||||||
|
GTH2 ?&yloop ( ymax* y+dy* [8000] )
|
||||||
|
POP2 POP2 POP2r JMP2r ( )
|
||||||
|
|
||||||
XMAX XMIN SUB2 WIDTH DIV2 ;&dx STA2
|
@evaluate ( x* y* -> count^ )
|
||||||
YMAX YMIN SUB2 HEIGHT DIV2 ;&dy STA2
|
#0000 DUP2 ,&x1 STR2 ( x* y* ; x1<-0 )
|
||||||
[ LIT2 01 -Screen/auto ] DEO
|
DUP2 ,&y1 STR2 ( x* y* ; y1<-0 )
|
||||||
YMAX YMIN
|
DUP2 ,&x2 STR2 ( x* y* ; x2<-0 )
|
||||||
&ver
|
,&y2 STR2 ( x* y* ; y2<-0 )
|
||||||
DUP2 ,&y STR2
|
LIT2r 2000 ( x* y* [20 00] )
|
||||||
XMAX XMIN
|
&loop ( x* y* [20 n^] )
|
||||||
&hor
|
[ LIT2 &x1 $2 ] ( x* y* x1* [20 n^] )
|
||||||
DUP2 ,&x STR2
|
[ LIT2 &y1 $2 ] ( x* y* x1* y1* [20 n^] )
|
||||||
#0000
|
smul2 DUP2 ADD2 ( x* y* 2x1y1* [20 n^] )
|
||||||
DUP2 ,&x1 STR2
|
OVR2 ADD2 ,&y1 STR2 ( x* y* [20 n^] ; y1<-2x1y1+y* )
|
||||||
DUP2 ,&y1 STR2
|
SWP2 [ LIT2 &x2 $2 ] ( y* x* x2* [20 n^] )
|
||||||
DUP2 ,&x2 STR2
|
[ LIT2 &y2 $2 ] SUB2 ( y* x* x2-y2* [20 n^] )
|
||||||
,&y2 STR2
|
OVR2 ADD2 ,&x1 STR2 SWP2 ( x* y* [20 n^] ; x1<-x2-y2+x* )
|
||||||
( pixel )
|
,&x1 LDR2 square ( x* y* x1^2* [20 n^] )
|
||||||
#2000
|
DUP2 ,&x2 STR2 ( x* y* x1^2* [20 n^] ; x2<-x1^2* )
|
||||||
&loop
|
,&y1 LDR2 square ( x* y* x1^2* y1^2* [20 n^] )
|
||||||
[ LIT2 &x1 $2 ] [ LIT2 &y1 $2 ] smul2 DUP2 ADD2
|
DUP2 ,&y2 STR2 ( x* y* x1^2* y1^2* [20 n^] ; y2<-y1^2* )
|
||||||
[ LIT2 &y $2 ] ADD2 ,&y1 STR2
|
ADD2 #4000 GTH2 ?&end ( x* y* [20 n^] )
|
||||||
[ LIT2 &x2 $2 ] [ LIT2 &y2 $2 ] SUB2
|
INCr GTHkr STHr ?&loop ( x* y* [20 n+1^] )
|
||||||
[ LIT2 &x $2 ] ADD2 ,&x1 STR2
|
&end ( x* y* [20 count^] )
|
||||||
,&x1 LDR2 DUP2 smul2
|
POP2 POP2 NIPr STHr JMP2r ( count^ )
|
||||||
DUP2 ,&x2 STR2
|
|
||||||
,&y1 LDR2 DUP2 smul2
|
|
||||||
DUP2 ,&y2 STR2
|
|
||||||
ADD2 #4000 GTH2 ?&end
|
|
||||||
INC GTHk ?&loop
|
|
||||||
&end
|
|
||||||
NIP .Screen/pixel DEO
|
|
||||||
( done. )
|
|
||||||
[ LIT2 &dx $2 ] ADD2 OVR2 #8000 ADD2 OVR2 #8000 ADD2 SWP2 LTH2 ?&hor
|
|
||||||
POP2 POP2
|
|
||||||
#0000 .Screen/x DEO2
|
|
||||||
.Screen/y DEI2k INC2 ROT DEO2
|
|
||||||
[ LIT2 &dy $2 ] ADD2 OVR2 #8000 ADD2 OVR2 #8000 ADD2 SWP2 LTH2 ?&ver
|
|
||||||
POP2 POP2
|
|
||||||
|
|
||||||
JMP2r
|
( multiply two signed 4.12 fixed point numbers )
|
||||||
|
@smul2 ( a* b* -> ab* )
|
||||||
|
LIT2r 0001 DUP2 #8000 LTH2 ?&bpos negate SWPr ( a* |b|* [sign*] )
|
||||||
|
&bpos SWP2 DUP2 #8000 LTH2 ?&apos negate SWPr ( |b|* |a|* [sign*] )
|
||||||
|
&apos smul2-pos STHr ?&abpos negate ( ab* [scrap^] )
|
||||||
|
&abpos POPr JMP2r ( ab* )
|
||||||
|
|
||||||
@smul2 ( a* b* -- c* )
|
( multiply two non-negative fixed point numbers )
|
||||||
LITr 00
|
( )
|
||||||
DUP2 #8000 LTH2 ?&b-positive
|
( a * b = {a0/16 + a1/4096} * {b0/16 + b1/4096} )
|
||||||
INCr DUP2k EOR2 SWP2 SUB2
|
( = a0b0/256 + a1b0/65536 + a0b1/65536 + a1b1/16777216 )
|
||||||
&b-positive
|
( = x + y + z + 0 ; the last term is too small to represent, i.e. zero )
|
||||||
SWP2
|
( )
|
||||||
DUP2 #8000 LTH2 ?&a-positive
|
( x = a0b0 << 4 )
|
||||||
INCr DUP2k EOR2 SWP2 SUB2
|
( y = a1b0 >> 4 )
|
||||||
&a-positive
|
( z = a0b1 >> 4 )
|
||||||
( ahi alo bhi blo )
|
@smul2-pos ( a* b* -> ab* )
|
||||||
LITr 00 STH ( ahi alo bhi / blo* )
|
aerate ROT2 aerate ( b0* b1* a0* a1* )
|
||||||
OVRr STH ( ahi alo / blo* bhi* )
|
STH2 ROT2k ( b0* b1* a0* b1* a0* b0* [a1*] )
|
||||||
OVRr STH ( ahi / blo* bhi* alo* )
|
STH2 MUL2r ( b0* b1* a0* b1* a0* [a1b0*] )
|
||||||
OVRr STH ( asign / blo* bhi* alo* ahi* )
|
MUL2 STH2 ADD2r ( b0* b1* a0* [a1b0+a0b1*] )
|
||||||
ROT2r MUL2kr STH2r ( asign ahi-bhi* / blo* alo* ahi* bhi* )
|
NIP2 MUL2 #07ff min #40 SFT2 ( a0b0* [y+z*] )
|
||||||
ROT2r MUL2kr STH2r ( asign ahi-bhi* alo-bhi* / blo* ahi* bhi* alo* )
|
STH2r #04 SFT2 ADD2 ( x* [y+z*] )
|
||||||
NIP2r ( asign ahi-bhi* alo-bhi* / blo* ahi* alo* )
|
#7fff !min ( ab* )
|
||||||
ROT2r MUL2kr STH2r ( asign ahi-bhi* alo-bhi* alo-blo* / ahi* alo* blo* )
|
|
||||||
ROT2r MUL2r STH2r POP2r ( asign ahi-bhi* alo-bhi* alo-blo* ahi-blo* )
|
|
||||||
SWP2 ( asign ahi-bhi* alo-bhi* ahi-blo* alo-blo* )
|
|
||||||
( 32-bit result is [ r3 r2 r1 r0 ] )
|
|
||||||
POP #00 SWP ( asign ahi-bhi* alo-bhi* ahi-blo* r21* )
|
|
||||||
( r21 max is 00fe, ahi-blo max is 7e81, max sum is 7f7f )
|
|
||||||
ADD2 ( asign ahi-bhi* alo-bhi* r21'* )
|
|
||||||
( r21' max is 7f7f, alo-bhi max is 7e81, max sum is fe00 )
|
|
||||||
ADD2 ( asign ahi-bhi* r21"* )
|
|
||||||
( The result we want is bits 27-12 due to the fixed point representation we use. )
|
|
||||||
#04 SFT2 SWP2 #07ff min #40 SFT2 ADD2
|
|
||||||
( saturate to +/-7.fff )
|
|
||||||
#7fff min
|
|
||||||
STHr #01 NEQ ?&result-positive
|
|
||||||
DUP2k EOR2 SWP2 SUB2
|
|
||||||
&result-positive
|
|
||||||
JMP2r
|
|
||||||
|
|
||||||
@min ( x* y* -- min* )
|
( equivalent to DUP2 smul2 but faster )
|
||||||
GTH2k [ JMP SWP2 NIP2 ] JMP2r
|
@square ( a* -> aa* )
|
||||||
|
DUP2 #8000 LTH2 ?&pos negate &pos
|
||||||
|
|
||||||
|
( >> )
|
||||||
|
|
||||||
|
( equivalent to DUP2 smul2-pos but faster )
|
||||||
|
@square-pos ( a* -> aa* )
|
||||||
|
aerate ( 00 ahi^ 00 alo^ )
|
||||||
|
OVR2 MUL2 #03 SFT2 SWP2 ( yz* ahi* )
|
||||||
|
DUP2 MUL2 #07ff min #40 SFT2 ( yz* x* )
|
||||||
|
ADD2 #7fff !min ( aa* )
|
||||||
|
|
||||||
|
( convert each byte of a short into a short )
|
||||||
|
@aerate ( x* -> 00 xhi^ 00 xlo^ ) SWP #0000 ROT SWP2 SWP JMP2r
|
||||||
|
|
||||||
|
( negate a fixed point number. doesn't work for #8000 )
|
||||||
|
@negate ( x* -> -x* ) DUP2k EOR2 SWP2 SUB2 JMP2r
|
||||||
|
|
||||||
|
( return the minimum of two non-negative numbers. )
|
||||||
|
@min ( x* y* ) GTH2k [ JMP SWP2 ] NIP2 JMP2r
|
||||||
|
|
Loading…
Reference in New Issue