uxn-utils/cli/lz/ulzenc.tal

170 lines
3.7 KiB
Tal
Raw Normal View History

2023-11-18 14:16:27 -05:00
( ulz encoder )
|10 @Console &vector $2 &read $1 &pad $5 &write $1 &err $1
|a0 @File &vector $2 &success $2 &stat $2 &delete $1 &append $1 &name $2 &length $2 &read $2 &write $2
|0000
@src $30
@dst $30
@ptr $1
2023-11-18 15:19:30 -05:00
@match-len $2
2023-11-18 16:22:25 -05:00
@output-ptr $2
@match-ctl $2
@dict-best $2
2023-11-18 17:09:09 -05:00
@combine $2
2023-11-18 16:22:25 -05:00
@dict $2
@dict-len $2
2023-11-18 14:16:27 -05:00
|0100
@ready-src ( -> )
;&await .Console/vector DEO2
BRK
&await ( -> )
.Console/read DEI .src skey ?ready-dst
BRK
@ready-dst ( -> )
;&await .Console/vector DEO2
BRK
&await ( -> )
.Console/read DEI .dst skey ?on-ready
BRK
@on-ready ( -> )
( | load raw )
;src .File/name DEO2
#4000 .File/length DEO2
;raw .File/read DEO2
;raw .File/success DEI2 uxn_lz_compress
2023-11-18 22:54:27 -05:00
( | write )
2023-11-18 22:45:01 -05:00
;dst .File/name DEO2
.output-ptr LDZ2 ;compressed SUB2 .File/length DEO2
;compressed .File/write DEO2
2023-11-18 14:16:27 -05:00
( halt ) #800f DEO
BRK
2023-11-18 15:19:30 -05:00
@<append-byte> ( byte -- )
.output-ptr LDZ2 INC2k .output-ptr STZ2 STA
JMP2r
2023-11-18 17:09:09 -05:00
@uxn_lz_compress ( input* length* -- )
2023-11-18 22:54:27 -05:00
( | fill variables )
2023-11-18 22:28:42 -05:00
;compressed .output-ptr STZ2
2023-11-18 17:09:09 -05:00
ADD2k NIP2 SWP2
2023-11-18 22:28:42 -05:00
&w ( end* start* -- )
2023-11-18 22:34:58 -05:00
EQU2k ?&end
2023-11-18 17:09:09 -05:00
( | get available dictionary size )
DUP2 ;raw SUB2 #0100 LTH2k ?{ SWP2 }
POP2 .dict-len STZ2
( | size of the string to search for )
SUB2k #3fff #0004 ADD2 LTH2k ?{ SWP2 }
POP2 ,&string-len STR2
( | itterate through the dictionary )
#0000 .match-len STZ2
DUP2 .dict-len LDZ2 SUB2 .dict STZ2
2023-11-18 22:28:42 -05:00
&for1 ( for ; dict_len; dict++, dict_len-- )
.dict-len LDZ2 #0000 EQU2 ?&end-for1
2023-11-18 17:09:09 -05:00
( Find common prefix length with the string )
#0000
2023-11-18 22:28:42 -05:00
&for2 ( for i = 0;; i++ )
2023-11-18 22:54:27 -05:00
( | If we reach the end of the string, it's the best possible match. )
2023-11-18 17:09:09 -05:00
DUP2 [ LIT2 &string-len $2 ] NEQ2 ?{
DUP2 .match-len STZ2
.dict LDZ2 .dict-best STZ2
2023-11-18 22:28:42 -05:00
POP2 !&done-search }
2023-11-18 22:54:27 -05:00
( | in[i] != dict[i % dict_len] break; )
2023-11-18 22:28:42 -05:00
( a ) ADD2k LDA STH
( b ) DUP2 .dict-len LDZ2 DIV2k MUL2 SUB2 .dict LDZ2 ADD2 LDA STHr
NEQ ?&end-for2
2023-11-18 17:09:09 -05:00
INC2 ORAk ?&for2
2023-11-18 22:28:42 -05:00
&end-for2
2023-11-18 22:54:27 -05:00
( | i > match_len )
2023-11-18 22:28:42 -05:00
DUP2 .match-len LDZ2 LTH2 ?{
2023-11-18 17:09:09 -05:00
DUP2 .match-len STZ2
.dict LDZ2 .dict-best STZ2 }
POP2
.dict LDZ2 INC2 .dict STZ2
2023-11-18 22:28:42 -05:00
.dict-len LDZ2 #0001 SUB2 .dict-len STZ2 !&for1
&end-for1
2023-11-18 17:09:09 -05:00
&done-search ( -- )
( CPY ) .match-len LDZ2 #0003 GTH2 ?op-cpy
2023-11-18 22:34:58 -05:00
( LIT ) !op-lit
&end
2023-11-18 22:54:27 -05:00
POP2 POP2
JMP2r
2023-11-18 17:09:09 -05:00
(
@|opcodes )
2023-11-18 16:14:23 -05:00
@op-cpy ( in* -- )
2023-11-18 22:54:27 -05:00
( | More numeric range: treat 0 as 4, 1 as 5, etc. )
2023-11-18 16:14:23 -05:00
.match-len LDZ2 #0004 SUB2 .match-ctl STZ2
2023-11-18 22:54:27 -05:00
( | CPY2 )
2023-11-18 16:14:23 -05:00
.match-ctl LDZ2 #003f GTH2 ?&cpy2
2023-11-18 22:54:27 -05:00
( | *output_ptr++ = match_ctl | 0x80; )
2023-11-18 22:45:01 -05:00
.match-ctl LDZ2 NIP #80 ORA <append-byte>
2023-11-18 16:14:23 -05:00
!&cpy-resume
2023-11-18 22:54:27 -05:00
&cpy2 ( -- )
2023-11-18 22:45:01 -05:00
.match-ctl LDZ2
2023-11-18 22:54:27 -05:00
SWP #c0 ORA <append-byte> <append-byte>
&cpy-resume ( -- )
( | *output_ptr++ = in - dict_best - 1; )
2023-11-18 22:45:01 -05:00
DUP2 .dict-best LDZ2 SUB2 #0001 SUB2 NIP <append-byte>
2023-11-18 22:54:27 -05:00
( | in += match_len; Advance input by size of the match )
2023-11-18 16:14:23 -05:00
.match-len LDZ2 ADD2
2023-11-18 22:54:27 -05:00
( | Disable combining previous literal, if any )
2023-11-18 16:14:23 -05:00
#0000 .combine STZ2
!uxn_lz_compress/w
@op-lit ( in* -- )
.combine LDZ2 ORA ?&combine
2023-11-18 22:54:27 -05:00
( | start a new literal )
( | Store this address, and later use it to increment the literal size. )
( | combine = output_ptr++; )
2023-11-18 16:14:23 -05:00
.output-ptr LDZ2
INC2k .output-ptr STZ2
.combine STZ2
2023-11-18 22:54:27 -05:00
( | *combine = 0; )
2023-11-18 16:14:23 -05:00
#00 .combine LDZ2 LDA2 STA
2023-11-18 22:54:27 -05:00
( | *output_ptr++ = *in++; )
2023-11-18 16:14:23 -05:00
LDAk <append-byte>
INC2 !uxn_lz_compress/w
&combine ( -- )
2023-11-18 22:54:27 -05:00
( | if ++*combine == 127 )
2023-11-18 16:14:23 -05:00
.combine LDZ2 LDA INC DUP #7f NEQ ?{ POP #00 }
.combine LDZ2 STA
LDAk <append-byte>
INC2 !uxn_lz_compress/w
2023-11-18 14:16:27 -05:00
(
@|stdlib )
@skey ( key buf -- proc )
OVR #21 LTH ?&eval
#00 SWP sput #00 JMP2r
&eval POP2 #01 JMP2r
@scap ( str* -- end* )
&w INC2 & LDAk ?&w
JMP2r
@sput ( chr str* -- )
scap/ INC2k #00 ROT ROT STA
STA
JMP2r
@getc ( -- b )
#0001 .File/length DEO2
;&b .File/read DEO2
[ LIT &b $1 ] JMP2r
(
@|memory )
@raw $4000
@compressed $4000