170 lines
3.5 KiB
Tal
170 lines
3.5 KiB
Tal
( ulz encoder )
|
|
|
|
|10 @Console &vector $2 &read $1 &pad $5 &write $1 &err $1
|
|
|a0 @File &vector $2 &success $2 &stat $2 &delete $1 &append $1 &name $2 &length $2 &read $2 &write $2
|
|
|
|
|0000
|
|
|
|
@src $30
|
|
@dst $30
|
|
@ptr $1
|
|
@match-len $2
|
|
@output-ptr $2
|
|
@match-ctl $2
|
|
@dict-best $2
|
|
@combine $2
|
|
@dict $2
|
|
@dict-len $2
|
|
|
|
|0100
|
|
|
|
@ready-src ( -> )
|
|
;&await .Console/vector DEO2
|
|
BRK
|
|
&await ( -> )
|
|
.Console/read DEI .src skey ?ready-dst
|
|
BRK
|
|
|
|
@ready-dst ( -> )
|
|
;&await .Console/vector DEO2
|
|
BRK
|
|
&await ( -> )
|
|
.Console/read DEI .dst skey ?on-ready
|
|
BRK
|
|
|
|
@on-ready ( -> )
|
|
( | load raw )
|
|
;src .File/name DEO2
|
|
#4000 .File/length DEO2
|
|
;raw .File/read DEO2
|
|
;raw .File/success DEI2 uxn_lz_compress
|
|
( halt ) #800f DEO
|
|
BRK
|
|
|
|
@<append-byte> ( byte -- )
|
|
.output-ptr LDZ2 INC2k .output-ptr STZ2 STA
|
|
JMP2r
|
|
|
|
@op-cpy ( in* -- )
|
|
( More numeric range: treat 0 as 4, 1 as 5, etc. )
|
|
.match-len LDZ2 #0004 SUB2 .match-ctl STZ2
|
|
( CPY2 )
|
|
.match-ctl LDZ2 #003f GTH2 ?&cpy2
|
|
( CPY1 )
|
|
( *output_ptr++ = match_ctl | 0x80; )
|
|
.match-ctl LDZ2 #0080 ORA2 <append-byte>
|
|
!&cpy-resume
|
|
&cpy2
|
|
( TODO )
|
|
&cpy-resume
|
|
( *output_ptr++ = in - dict_best - 1; )
|
|
DUP2 .dict-best LDZ2 #0001 SUB2 SUB2 <append-byte>
|
|
( in += match_len; Advance input by size of the match )
|
|
.match-len LDZ2 ADD2
|
|
( Disable combining previous literal, if any )
|
|
#0000 .combine STZ2
|
|
!uxn_lz_compress/w
|
|
|
|
@op-lit ( in* -- )
|
|
.combine LDZ2 ORA ?&combine
|
|
( start a new literal )
|
|
( Store this address, and later use it to increment the literal size. )
|
|
( combine = output_ptr++; )
|
|
.output-ptr LDZ2
|
|
INC2k .output-ptr STZ2
|
|
.combine STZ2
|
|
( *combine = 0; )
|
|
#00 .combine LDZ2 LDA2 STA
|
|
( *output_ptr++ = *in++; )
|
|
LDAk <append-byte>
|
|
INC2 !uxn_lz_compress/w
|
|
&combine ( -- )
|
|
( if ++*combine == 127 )
|
|
.combine LDZ2 LDA INC DUP #7f NEQ ?{ POP #00 }
|
|
.combine LDZ2 STA
|
|
LDAk <append-byte>
|
|
INC2 !uxn_lz_compress/w
|
|
|
|
@uxn_lz_compress ( input* length* -- )
|
|
ADD2k NIP2 SWP2
|
|
&w ( -- )
|
|
( | get available dictionary size )
|
|
DUP2 ;raw SUB2 #0100 LTH2k ?{ SWP2 }
|
|
POP2 .dict-len STZ2
|
|
( | size of the string to search for )
|
|
SUB2k #3fff #0004 ADD2 LTH2k ?{ SWP2 }
|
|
POP2 ,&string-len STR2
|
|
( | itterate through the dictionary )
|
|
#0000 .match-len STZ2
|
|
.dict-len LDZ2 SUB2k .dict STZ2
|
|
( | create a few inlines )
|
|
DUP2 ,&in STR2
|
|
&for1 ( dict-len != 0 )
|
|
( Find common prefix length with the string )
|
|
#0000
|
|
&for2 ( i != 0 )
|
|
( If we reach the end of the string, it's the best possible match. )
|
|
DUP2 [ LIT2 &string-len $2 ] NEQ2 ?{
|
|
DUP2 .match-len STZ2
|
|
.dict LDZ2 .dict-best STZ2
|
|
POP2 POP2 !&done-search }
|
|
( Dictionary repeats if we hit the end )
|
|
( in[i] != dict[i % dict_len] break; )
|
|
DUP2 [ LIT2 &in $2 ] ADD2 LDA2
|
|
OVR2 .dict-len LDZ2 DIV2k MUL2 SUB2
|
|
.dict LDZ2 ADD2 LDA2 NEQ2 ?&end
|
|
INC2 ORAk ?&for2
|
|
&end
|
|
( i > match_len )
|
|
DUP2 .match-len LDZ2 GTH2 #00 EQU ?{
|
|
DUP2 .match-len STZ2
|
|
.dict-len LDZ2 .dict STZ2 }
|
|
POP2
|
|
.dict LDZ2 INC2 .dict STZ2
|
|
#0001 SUB2 ORAk ?&for1
|
|
POP2
|
|
|
|
&done-search ( -- )
|
|
( CPY ) .match-len LDZ2 #0003 GTH2 ?op-cpy
|
|
( LIT ) op-lit
|
|
NEQ2k ?&w
|
|
JMP2r
|
|
|
|
(
|
|
@|stdlib )
|
|
|
|
@skey ( key buf -- proc )
|
|
OVR #21 LTH ?&eval
|
|
#00 SWP sput #00 JMP2r
|
|
&eval POP2 #01 JMP2r
|
|
|
|
@scap ( str* -- end* )
|
|
&w INC2 & LDAk ?&w
|
|
JMP2r
|
|
|
|
@sput ( chr str* -- )
|
|
scap/ INC2k #00 ROT ROT STA
|
|
STA
|
|
JMP2r
|
|
|
|
@getc ( -- b )
|
|
#0001 .File/length DEO2
|
|
;&b .File/read DEO2
|
|
[ LIT &b $1 ] JMP2r
|
|
|
|
@phex ( short* -- )
|
|
SWP phex/b
|
|
&b ( -- )
|
|
DUP #04 SFT phex/c
|
|
&c ( -- )
|
|
#0f AND DUP #09 GTH #27 MUL ADD [ LIT "0 ] ADD #18 DEO
|
|
JMP2r
|
|
|
|
(
|
|
@|memory )
|
|
|
|
@raw $4000
|
|
|
|
@compressed $4000
|
|
|