408 lines
10 KiB
Tal
408 lines
10 KiB
Tal
( math32.tal )
|
|
( )
|
|
( 32-bit integers are represented by two 16-bit integers )
|
|
( x** means xhi* xlo* )
|
|
|
|
( DEBUG writes #ff to device port #0e - presumably the system debug port; confirm against the target emulator )
%DEBUG { #ff #0e DEO }
|
|
( RTN returns from a subroutine entered with JSR2 )
%RTN { JMP2r }
|
|
( EMIT writes the byte on top of the stack to device port #18, which this file uses for character output )
%EMIT { #18 DEO }
|
|
( DIGIT ( n^ -> ) looks up byte n of the digits table and emits it )
%DIGIT { #00 SWP ;digits ADD2 LDA EMIT }
|
|
( SPACE and NEWLINE emit the ascii characters #20 and #0a )
%SPACE { #20 EMIT }
|
|
%NEWLINE { #0a EMIT }
|
|
|
|
( TOR ( a b c -> c a b ) is two ROTs, i.e. a rotation in the opposite direction )
%TOR { ROT ROT }
|
|
( TOR2 is the same rotation applied to three shorts )
%TOR2 { ROT2 ROT2 }
|
|
( POP4 drops four bytes, e.g. one 32-bit value )
%POP4 { POP2 POP2 }
|
|
|
|
( X, Y and Z each push a 32-bit operand, hi* then lo*, for the test cases )
%X { #0000 #0001 }
|
|
%Y { #1234 #ffff }
|
|
%Z { #fedc #ba98 }
|
|
|
|
|0100

( run a bunch of test cases )
( every line prints one result; groups are separated by an empty line )

( 16-bit by 8-bit division: prints the quotient short, a space, the remainder byte )
#1000 #03 ;divmod16-by-8 JSR2 ;emit-short-byte JSR2 NEWLINE
NEWLINE

( 32-bit left shifts, with counts on both sides of each 8-bit boundary )
#1124 #1244 #01 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #02 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #08 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #0f ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #10 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #13 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #17 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #18 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#1124 #1244 #19 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#0000 #0001 #1f ;left-shift JSR2 ;emit-long JSR2 NEWLINE
#0000 #0001 #20 ;left-shift JSR2 ;emit-long JSR2 NEWLINE
NEWLINE

( number of significant bits in a 32-bit value )
#0000 #0000 ;bitcount32 JSR2 ;emit-byte JSR2 NEWLINE
#0000 #0100 ;bitcount32 JSR2 ;emit-byte JSR2 NEWLINE
#0001 #0000 ;bitcount32 JSR2 ;emit-byte JSR2 NEWLINE
#0010 #0000 ;bitcount32 JSR2 ;emit-byte JSR2 NEWLINE
#1000 #0000 ;bitcount32 JSR2 ;emit-byte JSR2 NEWLINE
#f000 #0000 ;bitcount32 JSR2 ;emit-byte JSR2 NEWLINE
NEWLINE

( 16x16 multiply: mul16 returns a 32-bit product, so it is printed with )
( emit-long; emit-short would print only the low short and leave the high )
( short behind on the working stack after every test )
#ffff #ffff #2a ;mul16 ;emit-long ;test16 JSR2
#0001 #ffff #2a ;mul16 ;emit-long ;test16 JSR2
#ffff #0001 #2a ;mul16 ;emit-long ;test16 JSR2
#00ff #0001 #2a ;mul16 ;emit-long ;test16 JSR2
NEWLINE

( 32x32 multiply, low 32 bits of the product )
#ffff #ffff #ffff #ffff #2a ;mul32 ;emit-long ;test32 JSR2
#0000 #0001 #ffff #ffff #2a ;mul32 ;emit-long ;test32 JSR2
#0000 #0002 #0000 #ffff #2a ;mul32 ;emit-long ;test32 JSR2
#0001 #2345 #0034 #5678 #2a ;mul32 ;emit-long ;test32 JSR2
NEWLINE

( 32-bit addition )
X Y #2b ;add32 ;emit-long ;test32 JSR2
Z Y #2b ;add32 ;emit-long ;test32 JSR2
#fedc #0000 #1234 #0000 #2b ;add32 ;emit-long ;test32 JSR2
#fedc #0000 #0000 #0000 #2b ;add32 ;emit-long ;test32 JSR2
#0000 #0000 #0000 #0000 #2b ;add32 ;emit-long ;test32 JSR2
NEWLINE

( 32-bit subtraction )
#1234 #1234 #0000 #0001 #2d ;sub32 ;emit-long ;test32 JSR2
#1234 #1234 #0000 #1234 #2d ;sub32 ;emit-long ;test32 JSR2
#1234 #1234 #1234 #0001 #2d ;sub32 ;emit-long ;test32 JSR2
#1234 #1234 #1000 #0000 #2d ;sub32 ;emit-long ;test32 JSR2
#1234 #1234 #ffff #ffff #2d ;sub32 ;emit-long ;test32 JSR2
NEWLINE

( bitwise operations and comparisons; comparisons return a single byte )
X Y #26 ;and32 ;emit-long ;test32 JSR2
X Y #7c ;or32 ;emit-long ;test32 JSR2
X Y #5e ;xor32 ;emit-long ;test32 JSR2
X Y #3d ;eq32 ;emit-byte ;test32 JSR2
Y Y #3d ;eq32 ;emit-byte ;test32 JSR2
X Y #7e ;ne32 ;emit-byte ;test32 JSR2
X X #7e ;ne32 ;emit-byte ;test32 JSR2
BRK
|
|
|
|
@test16 ( x* y* symbol^ test-addr* emit-addr* -> )
	( prints "x <symbol> y = <result>" followed by a newline, where the )
	( result is produced by the routine at test-addr and printed by the )
	( routine at emit-addr )

	( move all five arguments into local storage, topmost first )
	,&emit-fn STR2 ,&test-fn STR2 ,&sym STR
	,&rhs STR2 ,&lhs STR2

	( left operand, symbol, right operand, equals sign )
	,&lhs LDR2 ;emit-short JSR2
	SPACE ,&sym LDR EMIT SPACE
	,&rhs LDR2 ;emit-short JSR2
	SPACE #3d EMIT SPACE

	( run the operation on x y, then hand its result to the printer )
	,&lhs LDR2 ,&rhs LDR2 ,&test-fn LDR2 JSR2
	,&emit-fn LDR2 JSR2 NEWLINE
	RTN

	[ &sym $1 &test-fn $2 &emit-fn $2 ]
	[ &lhs $2 &rhs $2 ]
|
|
|
|
@test32 ( x** y** symbol^ test-addr* emit-addr* -> )
	( 32-bit counterpart of test16: prints "x <symbol> y = <result>" and a )
	( newline; test-addr computes the result and emit-addr prints it )

	( move the arguments into local storage, topmost first )
	,&emit-fn STR2 ,&test-fn STR2 ,&sym STR
	,&rhs-lo STR2 ,&rhs-hi STR2
	,&lhs-lo STR2 ,&lhs-hi STR2

	( left operand, symbol, right operand, equals sign )
	,&lhs-hi LDR2 ,&lhs-lo LDR2 ;emit-long JSR2
	SPACE ,&sym LDR EMIT SPACE
	,&rhs-hi LDR2 ,&rhs-lo LDR2 ;emit-long JSR2
	SPACE #3d EMIT SPACE

	( push x** y** again, run the operation, print whatever it returns )
	,&lhs-hi LDR2 ,&lhs-lo LDR2
	,&rhs-hi LDR2 ,&rhs-lo LDR2
	,&test-fn LDR2 JSR2
	,&emit-fn LDR2 JSR2 NEWLINE
	RTN

	[ &sym $1 &test-fn $2 &emit-fn $2 ]
	[ &lhs-hi $2 &lhs-lo $2 &rhs-hi $2 &rhs-lo $2 ]
|
|
|
|
@bitcount8 ( x^ -> n^ )
	( n is how many right shifts it takes to make x zero, i.e. the )
	( position of the highest set bit: 0 for x = 0, 8 for x >= #80 )
	#00 SWP ( n x )
	&step
	DUP ,&shift JCN ( n x ; x still has bits set => shift once more )
	POP RTN ( n )
	&shift
	#01 SFT ( n x>>1 )
	SWP INC SWP ( n+1 x>>1 )
	,&step JMP
|
|
|
|
@bitcount16 ( x* -> n^ )
	( number of significant bits in a short, built from bitcount8 )
	SWP ;bitcount8 JSR2 ( xlo nhi )
	DUP ,&upper JCN ( nhi != 0 => the low byte cannot change the answer )
	( high byte is zero: the answer is bitcount8 of the low byte, so drop )
	( the zero and let bitcount8 return straight to our caller )
	POP ;bitcount8 JMP2
	&upper
	SWP POP #08 ADD ( nhi+8 )
	RTN
|
|
|
|
@bitcount32 ( x** -> n^ )
	( number of significant bits in a 32-bit value, built from bitcount16 )
	SWP2 ;bitcount16 JSR2 ( xlo* nhi )
	DUP ,&upper JCN ( nhi != 0 => the low short cannot change the answer )
	( high short is zero: drop the zero count and finish with bitcount16 )
	( of the low short, which returns straight to our caller )
	POP ;bitcount16 JMP2
	&upper
	TOR POP2 #10 ADD ( nhi+16 )
	RTN
|
|
|
|
@eq32 ( xhi* xlo* yhi* ylo* -> bool^ )
	( pushes #01 when x and y are equal, #00 otherwise )
	( x = y exactly when [xhi^yhi] | [xlo^ylo] is zero )
	ROT2 EOR2 ( xhi* yhi* dlo* ; dlo = xlo^ylo )
	TOR2 EOR2 ( dlo* dhi* ; dhi = xhi^yhi )
	ORA2 #0000 EQU2 ( bool^ )
	RTN
|
|
|
|
@eq-zero32 ( x** -> bool^ )
	( pushes #01 when all four bytes of x are zero, #00 otherwise )
	ORA2 ( xhi|xlo as a short )
	ORA ( all four bytes or-ed into one )
	#00 EQU
	RTN
|
|
|
|
@ne32 ( xhi* xlo* yhi* ylo* -> bool^ )
	( pushes #01 when x and y differ, #00 when they are equal )
	( x != y exactly when [xhi^yhi] | [xlo^ylo] is non-zero )
	ROT2 EOR2 ( xhi* yhi* dlo* ; dlo = xlo^ylo )
	TOR2 EOR2 ( dlo* dhi* ; dhi = xhi^yhi )
	ORA2 #0000 NEQ2 ( bool^ )
	RTN
|
|
|
|
@ne-zero32 ( x** -> bool^ )
	( pushes #01 when any byte of x is non-zero, #00 otherwise )
	ORA2 ( xhi|xlo as a short )
	ORA ( all four bytes or-ed into one )
	#00 NEQ
	RTN
|
|
|
|
@and32 ( xhi* xlo* yhi* ylo* -> xhi&yhi* xlo&ylo* )
	( bitwise AND of two 32-bit values, one short at a time )
	ROT2 AND2 ( xhi* yhi* lo* ; lo = xlo&ylo )
	SWP2 ROT2 AND2 ( lo* hi* ; hi = xhi&yhi )
	SWP2 ( hi* lo* )
	RTN
|
|
|
|
@or32 ( xhi* xlo* yhi* ylo* -> xhi|yhi* xlo|ylo* )
	( bitwise OR of two 32-bit values, one short at a time )
	ROT2 ORA2 ( xhi* yhi* lo* ; lo = xlo|ylo )
	SWP2 ROT2 ORA2 ( lo* hi* ; hi = xhi|yhi )
	SWP2 ( hi* lo* )
	RTN
|
|
|
|
@xor32 ( xhi* xlo* yhi* ylo* -> xhi^yhi* xlo^ylo* )
	( bitwise XOR of two 32-bit values, one short at a time )
	ROT2 EOR2 ( xhi* yhi* lo* ; lo = xlo^ylo )
	SWP2 ROT2 EOR2 ( lo* hi* ; hi = xhi^yhi )
	SWP2 ( hi* lo* )
	RTN
|
|
|
|
( COMPLEMENT32 ( x** -> ~x** ) flips every bit of a 32-bit value in place: )
( low short first, then the high short, then the order is restored )
%COMPLEMENT32 { #ffff EOR2 SWP2 #ffff EOR2 SWP2 }

@complement32 ( x** -> ~x** )
	( callable wrapper around the COMPLEMENT32 macro )
	COMPLEMENT32
	RTN
|
|
|
|
@negate32 ( x** -> -x** )
	( two's complement negation: flip every bit, then add one )
	COMPLEMENT32 ( ~xhi* ~xlo* )
	INC2 ( ~xhi* -xlo* )
	( the increment carries into the high short only when the low short )
	( wrapped around to zero; or-ing its two bytes tests for that )
	ORAk ,&no-carry JCN
	SWP2 INC2 SWP2 ( -xhi* -xlo* )
	&no-carry
	RTN
|
|
|
|
@left-by-16 ( xhi* xlo* -> xlo* 0000 )
	( shifting left by 16 moves the low short up and zero-fills below it )
	#0000 ( xhi* xlo* 0000 )
	ROT2 POP2 ( xlo* 0000 ; the old high short is discarded )
	RTN
|
|
|
|
@left-shift ( x** n^ -> x<<n )
	( shifts a 32-bit value left by n bits. the work is done by one of four )
	( routines, chosen by how many whole bytes the shift moves; each of them )
	( receives x** n^ unchanged and returns directly to our caller )
	DUP #08 LTH ;left-shift0 JCN2 ( x n ; 0-7 bits )
	DUP #10 LTH ;left-shift1 JCN2 ( x n ; 8-15 bits )
	DUP #18 LTH ;left-shift2 JCN2 ( x n ; 16-23 bits )
	DUP #20 LTH ;left-shift3 JCN2 ( x n ; 24-31 bits )
	( n >= 32: every bit is shifted out. this is handled here because the )
	( shift control byte computed by left-shift3 wraps around for n >= 40 )
	POP POP2 POP2 #0000 #0000
	RTN
|
|
|
|
( shift left by 0-7 bits )
@left-shift0 ( x** n^ -> x<<n )
	( x is the byte sequence x0 x1 x2 x3, x0 being the most significant. )
	( each byte is shifted as a short so that the bits leaving its top end )
	( up in the byte above, and the pieces are or-ed together in z0..z3 )

	#40 SFT ,&r STR ( n<<4 -> r, the SFT control byte for "left by n" )

	( z1..z3 are read back before they are fully written, so they must )
	( start out as zero; otherwise bytes of the previous result leak in )
	#0000 ,&z1 STR2
	#00 ,&z3 STR

	SWP SWP2 SWP ( x3 x2 x1 x0 )

	,&r LDR SFT ,&z0 STR ( x3 x2 x1 ; z0 = x0<<n )

	#00 SWP ,&r LDR SFT2 ( x3 x2 00x1<<r )
	,&z0 LDR2 ORA2 ,&z0 STR2 ( x3 x2 ; merged into z0z1 )

	#00 SWP ,&r LDR SFT2 ( x3 00x2<<r )
	,&z1 LDR2 ORA2 ,&z1 STR2 ( x3 ; merged into z1z2 )

	#00 SWP ,&r LDR SFT2 ( 00x3<<r )
	,&z2 LDR2 ORA2 ,&z2 STR2 ( ; merged into z2z3 )

	,&z0 LDR2 ,&z2 LDR2 ( zhi* zlo* )
	RTN

	[ &r $1 &z0 $1 &z1 $1 &z2 $1 &z3 $1 ]
|
|
|
|
( shift left by 8-15 bits )
@left-shift1 ( x** n^ -> x<<n )
	( the top byte x0 is shifted out entirely and the bottom result byte is )
	( zero; the remaining three bytes are shifted by n-8 bits into z0..z2 )

	#08 SUB #40 SFT ,&r STR ( [n-8]<<4 -> r, the SFT control byte )

	( z1 and z2 are read back before they are fully written, so they must )
	( start out as zero; otherwise bytes of the previous result leak in )
	#0000 ,&z1 STR2

	SWP SWP2 SWP POP ( x3 x2 x1 )

	,&r LDR SFT ,&z0 STR ( x3 x2 ; z0 = x1<<[n-8] )

	#00 SWP ,&r LDR SFT2 ( x3 00x2<<r )
	,&z0 LDR2 ORA2 ,&z0 STR2 ( x3 ; merged into z0z1 )

	#00 SWP ,&r LDR SFT2 ( 00x3<<r )
	,&z1 LDR2 ORA2 ,&z1 STR2 ( ; merged into z1z2 )

	,&z0 LDR2 ,&z2 LDR #00 ( z0 z1 z2 00 )
	RTN

	[ &r $1 &z0 $1 &z1 $1 &z2 $1 ]
|
|
|
|
( shift left by 16-23 bits )
@left-shift2 ( x** n^ -> x<<n )
	( the high short is shifted out entirely and the low result short is )
	( zero; the low short of x is shifted by n-16 bits into z0z1 )

	#10 SUB #40 SFT ,&r STR ( [n-16]<<4 -> r, the SFT control byte )

	( z1 is read back before it is written, so it must start out as zero; )
	( otherwise a byte of the previous result leaks in )
	#00 ,&z1 STR

	SWP2 POP2 SWP ( x3 x2 )

	,&r LDR SFT ,&z0 STR ( x3 ; z0 = x2<<[n-16] )

	#00 SWP ,&r LDR SFT2 ( 00x3<<r )
	,&z0 LDR2 ORA2 ,&z0 STR2 ( ; merged into z0z1 )

	,&z0 LDR2 #0000 ( z0 z1 0000 )
	RTN

	[ &r $1 &z0 $1 &z1 $1 ]
|
|
|
|
( shift left by 24-31 bits )
@left-shift3 ( x** n^ -> x<<n )
	( only the lowest byte x3 survives: it becomes the top result byte, )
	( shifted by n-24 bits, and the other three result bytes are zero )
	#18 SUB #40 SFT ( x0 x1 x2 x3 r ; r = [n-24]<<4 )
	SFT ( x0 x1 x2 y ; y = x3<<[n-24] )
	TOR POP2 ( x0 y )
	SWP POP ( y )
	#00 #0000 ( y 00 0000 )
	RTN
|
|
|
|
@add32 ( xhi* xlo* yhi* ylo* -> zhi* zlo* )
|
|
( adds two 32-bit values one byte at a time, lowest byte first. )
( each byte pair is added as a short so the carry lands in the next )
( higher byte of z, where the following step picks it up. )
( a carry out of the top byte is dropped, so the sum wraps at 32 bits. )
,&y2 STR2 ,&y0 STR2 ( save ylo, yhi )
|
|
,&x2 STR2 ,&x0 STR2 ( save xlo, xhi )
|
|
#0000 #0000 ,&z0 STR2 ,&z2 STR2 ( reset zhi, zlo )
|
|
|
|
( x3 + y3 => z2z3 )
( z2 receives the carry, z3 the low result byte )
|
|
#00 ,&x3 LDR #00 ,&y3 LDR ADD2 ,&z2 STR2
|
|
|
|
( x2 + y2 + z2 => z1z2 )
( z1 is still zero here, so the short z1z2 is just the carry held in z2 )
|
|
#00 ,&x2 LDR ,&z1 LDR2 ADD2 ,&z1 STR2
|
|
#00 ,&y2 LDR ,&z1 LDR2 ADD2 ,&z1 STR2
|
|
|
|
( x1 + y1 + z1 => z0z1 )
|
|
#00 ,&x1 LDR ,&z0 LDR2 ADD2 ,&z0 STR2
|
|
#00 ,&y1 LDR ,&z0 LDR2 ADD2 ,&z0 STR2
|
|
|
|
( x0 + y0 + z0 => z0 )
( byte-sized adds: the carry out of the top byte is discarded )
|
|
,&x0 LDR ,&z0 LDR ADD ,&z0 STR
|
|
,&y0 LDR ,&z0 LDR ADD ,&z0 STR
|
|
|
|
( load zhi,zlo )
|
|
,&z0 LDR2 ,&z2 LDR2
|
|
RTN
|
|
( registers for add32 )
( byte 0 is the most significant byte; &z2 reserves two bytes, the )
( second being the z3 that the comments above refer to )
|
|
[ &x0 $1 &x1 $1 &x2 $1 &x3 $1 ]
|
|
[ &y0 $1 &y1 $1 &y2 $1 &y3 $1 ]
|
|
[ &z0 $1 &z1 $1 &z2 $2 ]
|
|
|
|
@sub32 ( x** y** -> z** )
	( x - y is computed as x + [-y] )
	;negate32 JSR2 ( x** -y** )
	;add32 JMP2 ( add32 returns straight to our caller )
|
|
|
|
@mul16 ( x* y* -> z** )
|
|
( multiplies two shorts into a full 32-bit product. )
( with x = x0 x1 and y = y0 y1, byte 0 being the high byte: )
( z = x * y1 is built in the three bytes z0 z1 z2, )
( a = x * y0 is built in the three bytes a0 a1 a2, )
( and the result is z + a<<8, summed by add32. )
,&y1 STR ,&y0 STR ( save ylo, yhi )
|
|
,&x1 STR ,&x0 STR ( save xlo, xhi )
|
|
#0000 #00 ,&z0 STR2 ,&z2 STR ( reset z0,z1,z2 )
|
|
#0000 #00 ,&a0 STR2 ,&a2 STR ( reset a0,a1,a2 )
|
|
|
|
( x1 * y1 => z1z2 )
|
|
#00 ,&x1 LDR #00 ,&y1 LDR MUL2 ,&z1 STR2
|
|
|
|
( x0 * y1 => z0z1 )
( added to z0z1, whose low byte already holds the high byte of x1*y1 )
|
|
#00 ,&x0 LDR #00 ,&y1 LDR MUL2 ,&z0 LDR2 ADD2 ,&z0 STR2
|
|
|
|
( x1 * y0 => a1a2 )
|
|
#00 ,&x1 LDR #00 ,&y0 LDR MUL2 ,&a1 STR2
|
|
|
|
( x0 * y0 => a0a1 )
( added to a0a1, whose low byte already holds the high byte of x1*y0 )
|
|
#00 ,&x0 LDR #00 ,&y0 LDR MUL2 ,&a0 LDR2 ADD2 ,&a0 STR2
|
|
|
|
( add z and a<<8 )
( z is pushed as 00 z0 z1 z2 and a as a0 a1 a2 00 )
|
|
#00 ,&z0 LDR2 ,&z2 LDR
|
|
,&a0 LDR2 ,&a2 LDR #00
|
|
;add32 JSR2
|
|
RTN
|
|
( scratch bytes for mul16 )
[ &x0 $1 &x1 $1 ]
|
|
[ &y0 $1 &y1 $1 ]
|
|
[ &z0 $1 &z1 $1 &z2 $1 ]
|
|
[ &a0 $1 &a1 $1 &a2 $1 ]
|
|
|
|
@mul32 ( x** y** -> z** )
	( low 32 bits of the product of two 32-bit values: )
	( z = xlo*ylo + [xhi*ylo + xlo*yhi]<<16 )
	( xhi*yhi would be shifted left by 32 bits, so it never contributes )
	,&ylo STR2 ,&yhi STR2 ( stash y )
	,&xlo STR2 ,&xhi STR2 ( stash x )

	,&ylo LDR2 ,&xlo LDR2 ;mul16 JSR2 ( phi* plo* ; the full xlo*ylo )
	SWP2 ( plo* phi* )

	( the cross terms only affect the high short; MUL2 and ADD2 wrap at )
	( 16 bits, which discards exactly the bits that overflow 32 )
	,&ylo LDR2 ,&xhi LDR2 MUL2 ADD2 ( plo* phi+xhi*ylo )
	,&yhi LDR2 ,&xlo LDR2 MUL2 ADD2 ( plo* zhi* )

	SWP2 ( zhi* zlo* )
	RTN

	[ &xhi $2 &xlo $2 &yhi $2 &ylo $2 ]
|
|
|
|
@divmod32-by-32 ( x** y** -> q** r** )
	( NOTE: unfinished. only the setup below is implemented: it stores the )
	( operands, clears the quotient and records the difference between the )
	( bit lengths of dividend and divisor. no quotient or remainder is )
	( computed yet, so what is left on the stack does NOT match the )
	( signature above; it is rembits^ divbits^ divhi* divlo* )

	,&div1 STR2 ,&div0 STR2 ( y -> div )
	,&rem1 STR2 ,&rem0 STR2 ( x -> rem )

	( both shorts of quo are cleared; the second store used to be missing, )
	( which left three stray bytes on the stack )
	#0000 #0000 ,&quo1 STR2 ,&quo0 STR2 ( 0 -> quo )

	( bitcount32 takes hi* lo*; the divisor used to be passed lo* hi* )
	,&rem0 LDR2 ,&rem1 LDR2 ;bitcount32 JSR2 ( rembits^ )
	,&div0 LDR2 ,&div1 LDR2 ;bitcount32 JSR2 ( rembits^ divbits^ )

	SUBk ,&shift STR ( rembits divbits ; shift = rembits-divbits )
	,&div0 LDR2 ,&div1 LDR2 ( rembits divbits divhi* divlo* )

	RTN

	( in each pair the 0 label is the high short and the 1 label the low short )
	[ &div0 $2 &div1 $2
	  &rem0 $2 &rem1 $2
	  &quo0 $2 &quo1 $2
	  &shift $1 ]
|
|
|
|
@divmod16-by-8 ( x* y^ -> q* r^ )
|
|
( long division of a short by a byte, one dividend byte at a time. )
( x0 is the high byte of x and x1 the low byte; q0 and q1 are the high )
( and low bytes of the quotient. )
DUP ,&y STR
|
|
ROT SWP ( x1 x0 y )
|
|
( first step: divide the high byte by y )
DIVk ( x1 x0 y q0 )
|
|
DUP ,&q0 STR ( x1 x0 y q0 )
|
|
MUL SUB ( x1 r=x0-y*q0 )
|
|
( second step: the first remainder becomes the high byte of the next )
( dividend, r x1, which is divided by y as a short )
SWP #00 ,&y LDR ( r x1 00 y )
|
|
DIV2k ( rx1 00y q1 )
|
|
DUP2 ROT2 MUL2 ( rx1 q1 y*q1 )
|
|
ROT2 SWP2 SUB2 ( q1 rr=rx1-y*q1 )
|
|
( keep only the low byte of the remainder and of q1 )
SWP POP ( q1 rrlo )
|
|
ROT POP ( q1lo rrlo )
|
|
( slide the saved q0 underneath to form q0 q1lo rrlo, i.e. q* r^ )
,&q0 LDR TOR
|
|
RTN
|
|
[ &y $1 &q0 $1 ]
|
|
|
|
@emit-long ( hi* lo* -> )
	( prints a 32-bit value as eight hex digits, high short first )
	SWP2 ( lo* hi* )
	;emit-short JSR2 ( lo* ; high short printed )
	;emit-short JMP2 ( low short printed; returns straight to our caller )
|
|
|
|
( EMIT-BYTE ( x^ -> ) prints a byte as two hex digits: the high nibble first, then the low nibble )
%EMIT-BYTE { DUP #04 SFT DIGIT #0f AND DIGIT }
|
|
|
|
@emit-short-byte ( x* y^ -> )
	( prints the short x, a space, then the byte y, all in hex )
	TOR ( y^ x* )
	;emit-short JSR2 ( y^ )
	SPACE
	;emit-byte JMP2 ( emit-byte returns straight to our caller )
|
|
|
|
@emit-short ( x* -> )
	( prints a short as four hex digits, high byte first )
	SWP ( lo^ hi^ )
	;emit-byte JSR2 ( lo^ ; high byte printed )
	;emit-byte JMP2 ( low byte printed; returns straight to our caller )
|
|
|
|
@emit-byte ( x^ -> )
	( prints a byte as two hex digits )
	DUP #04 SFT DIGIT ( x^ ; high nibble printed )
	#0f AND DIGIT ( low nibble printed )
	RTN
|
|
|
|
( lookup table used by DIGIT: the ascii character for each nibble value 0-15 )
@digits
	"0123456789abcdef
|