440 lines
15 KiB
Tal
440 lines
15 KiB
Tal
( tal.tal )
|
|
( )
|
|
( by d_m )
|
|
( )
|
|
( see https://en.wikipedia.org/wiki/Tar_(computing)#UStar_format )
|
|
( )
|
|
( TODO: )
|
|
( - check for "ustar" header )
|
|
( - handle filename-prefix )
|
|
( - handle 'L' entries )
|
|
( - support creating archives )
|
|
( - arg validation should depend on mode )
|
|
( - validate checksums )
|
|
( - better error messages on unsupported files, e.g. symlinks )
|
|
( - better usage message )
|
|
( - support using "-" for stdin/stdout? )
|
|
( - option to ignore symlinks? )
|
|
|
|
( File1 is used to read/write the tar file )
|
|
( File2 is used to read/write files and directories )
|
|
|a0 @File1 [ &vec $2 &ok $2 &stat $2 &del $1 &append $1 &name $2 &len $2 &r $2 &w $2 ]
|
|
|b0 @File2 [ &vec $2 &ok $2 &stat $2 &del $1 &append $1 &name $2 &len $2 &r $2 &w $2 ]
|
|
|
|
|0100
|
|
;arg-callback ;on-stdin arg/init BRK
|
|
|
|
( exit abnormally )
|
|
@panic ( -> $exit )
|
|
#010e DEO #010f DEO BRK
|
|
|
|
( handle all provided command-line arguments )
|
|
@arg-callback ( -> )
|
|
;arg/count LDA
|
|
DUP #00 EQU ?&missing-mode
|
|
DUP #01 EQU ?&missing-file
|
|
#02 GTH ?&toomany !run
|
|
&missing-mode ;missing-mode !&error
|
|
&missing-file ;missing-filename !&error
|
|
&toomany ;too-many-arguments
|
|
&error print ;usage print #01 !exit
|
|
|
|
( run the program )
|
|
@run ( -> BRK )
|
|
#01 arg/read .File1/name DEO2
|
|
#00 arg/read LDA
|
|
DUP LIT "t NEQ ?{ list-entries #00 !exit }
|
|
DUP LIT "x NEQ ?{ expand-entries #00 !exit }
|
|
POP ;invalid-mode print ;usage print #00 !exit
|
|
|
|
( exit normally )
|
|
@exit ( code^ -> BRK )
|
|
#80 ORA #0f DEO BRK
|
|
|
|
( ignore stdin once we've processed the args )
|
|
@on-stdin ( -> BRK )
|
|
BRK
|
|
|
|
( print a null-terminated string )
|
|
@print ( s* -> )
|
|
&loop LDAk ?{ POP2 JMP2r }
|
|
LDAk #18 DEO INC2 !&loop
|
|
|
|
( print up to `len` bytes from string. stops on NUL. )
|
|
@lprint ( s* len* -> )
|
|
OVR2 ADD2 SWP2 ( limit* s* )
|
|
&loop LDAk ?{ !&done } ( limit* s* )
|
|
LDAk #18 DEO INC2 GTH2k ?&loop ( limit* s+1* )
|
|
&done POP2 POP2 JMP2r ( )
|
|
|
|
( read 512 bytes of header for the next tar entry. )
|
|
( assumes .File1/name is already set. )
|
|
@read-header ( -> ok^ )
|
|
#0200 .File1/len DEO2
|
|
;header .File1/r DEO2
|
|
( TODO validate checksum )
|
|
.File1/ok DEI2 #0200 EQU2 JMP2r
|
|
|
|
( list all the entries in the tar archive )
|
|
@list-entries ( -> )
|
|
read-header ?{ JMP2r }
|
|
;header/filename LDA ?&non-null
|
|
#800f DEO BRK
|
|
&non-null
|
|
;header/type LDA ( type^ )
|
|
DUP #00 EQU ?list-file ( type^ )
|
|
DUP LIT "0 EQU ?list-file ( type^ )
|
|
DUP LIT "5 EQU ?list-dir ( type^ )
|
|
DUP LIT "7 EQU ?list-file ( type^ )
|
|
DUP LIT "x EQU ?list-posix-meta ( type^ )
|
|
!list-unsupported
|
|
|
|
@list-posix-meta ( type^ -> )
|
|
POP
|
|
;header/size load-octal11 STH2 ( s0^ s1* [s2*] )
|
|
ORA ORA ?&meta-too-big
|
|
|
|
&meta-too-big
|
|
POP2r ;meta-too-big print
|
|
;header/size dump-longer #0a18 DEO
|
|
!list-unsupported
|
|
|
|
( verbose file entry listing )
|
|
@list-unsupported ( type^ -> )
|
|
;unsupported print
|
|
#18 DEO #2018 DEO
|
|
;header/size load-octal11 dump-longer #2018 DEO
|
|
;header/filename sanitize-path
|
|
#0064 lprint #0a18 DEO
|
|
;header/size load-octal11 round-up-to-512 skip !list-entries
|
|
|
|
( verbose file entry listing )
|
|
@list-file ( type^ -> )
|
|
POP
|
|
LIT "f #18 DEO #2018 DEO
|
|
;header/size load-octal11 dump-longer #2018 DEO
|
|
;header/filename #0064 lprint #0a18 DEO
|
|
;header/size load-octal11 round-up-to-512 skip !list-entries
|
|
|
|
( verbose directory entry listing )
|
|
@list-dir ( 00^ -> )
|
|
POP
|
|
LIT "d #18 DEO #2018 DEO
|
|
;header/size load-octal11 dump-longer #2018 DEO
|
|
;header/filename #0064 lprint #0a18 DEO
|
|
!list-entries
|
|
|
|
( expand a .tar archive in the current working directory )
|
|
@expand-entries ( -> )
|
|
read-header ?{ JMP2r }
|
|
;header/filename LDA ?&non-null
|
|
#800f DEO BRK
|
|
&non-null
|
|
;header/type LDA ( type^ )
|
|
DUP #00 EQU ?expand-file ( type^ )
|
|
DUP LIT "0 EQU ?expand-file ( type^ )
|
|
DUP LIT "5 EQU ?expand-dir ( type^ )
|
|
DUP LIT "7 EQU ?expand-file ( type^ )
|
|
!expand-unsupported
|
|
|
|
( remove leading / of an absolute path )
|
|
@sanitize-path ( s* -> s1* )
|
|
LDAk LIT "/ NEQ JMP INC2 JMP2r
|
|
|
|
@remainder-512 ( n* -> extra* )
|
|
#01ff AND2 #0200 DUP2 ROT2 SUB2 NEQ2k ?{ POP2 #0000 } NIP2 JMP2r
|
|
|
|
@expand-file ( type^ -> )
|
|
POP
|
|
;header/filename sanitize-path
|
|
DUP2 #0064 lprint #0a18 DEO
|
|
.File2/name DEO2
|
|
;header/size load-octal11 STH2k write
|
|
STH2r remainder-512 skip-lo !expand-entries
|
|
|
|
@expand-dir ( type^ -> )
|
|
POP
|
|
;header/filename sanitize-path
|
|
DUP2 #0064 lprint #0a18 DEO
|
|
.File2/name DEO2
|
|
#0004 .File2/len DEO2
|
|
#0001 .File2/w DEO2
|
|
!expand-entries
|
|
|
|
@expand-unsupported ( type^ -> )
|
|
;unsupported print
|
|
#18 DEO LIT2 ": 18 DEO #2018 DEO
|
|
;header/filename sanitize-path
|
|
#0064 lprint #0a18 DEO
|
|
;header/size load-octal11 round-up-to-512 skip !expand-entries
|
|
|
|
( src and dst should be paths )
|
|
@compress-entries ( src* dst* -> )
|
|
POP2 POP2 JMP2r
|
|
|
|
( writes `n` bytes from File1 to File2 )
|
|
( uses a 32k internal buffer )
|
|
@write ( carry^ hi* lo* -> )
|
|
;write-buf ;write-lo/writer STA2
|
|
write-lo write-hi ?write-4g JMP2r
|
|
|
|
( writes up to 32768 bytes of; limited by the size of buf )
|
|
@write-buf ( n* -> )
|
|
ORAk ?{ POP2 JMP2r } ( n* )
|
|
DUP2 .File1/len DEO2 ( n* )
|
|
;buffer .File1/r DEO2 ( n* )
|
|
DUP2 .File1/ok DEI2 EQU2 ?&ok ( n* )
|
|
POP2 ;read-error print !panic ( )
|
|
&ok ( n* )
|
|
DUP2 .File2/len DEO2 ( n* )
|
|
;buffer .File2/w DEO2 ( n* )
|
|
.File2/ok DEI2 EQU2 ?&ok2 ( )
|
|
;write-error print !panic ( )
|
|
&ok2 JMP2r ( )
|
|
|
|
( skips `n` bytes forward in File1, specified as a 5-byte integer )
|
|
( )
|
|
( since we can only actually read 32k at a time, and since we can )
|
|
( only easily work with 2-byte shorts, we first read the lowest )
|
|
( two bytes and skip that much. then, for the higher byte, we can )
|
|
( do two skips of 32k for each unit found. )
|
|
@skip ( carry^ hi* lo* -> )
|
|
;skip-buf ;write-lo/writer STA2
|
|
write-lo write-hi ?write-4g JMP2r
|
|
|
|
@skip-lo ( lo* -> )
|
|
;skip-buf ;write-lo/writer STA2 !write-lo
|
|
|
|
( skips up to 32768 bytes of; limited by the size of buf )
|
|
@skip-buf ( n* -> )
|
|
ORAk ?{ POP2 JMP2r }
|
|
DUP2 .File1/len DEO2
|
|
;buffer .File1/r DEO2
|
|
.File1/ok DEI2 EQU2 ?&ok
|
|
;read-error print !panic
|
|
&ok JMP2r
|
|
|
|
( unconditionally write 4GiB, that is 4294967296 bytes )
|
|
@write-4g ( -> ) write-2g ( >> )
|
|
|
|
( unconditionally write 2GiB, that is 2147483648 bytes )
|
|
@write-2g ( -> ) #8000 !write-hi
|
|
|
|
( writes `hi*65536` bytes )
|
|
( - 0001 will write 65536 bytes )
|
|
( - 0010 will write 1048576 bytes )
|
|
( - ffff will write 4294901760 bytes )
|
|
@write-hi ( hi* -> )
|
|
#0000 SWP2 SUB2 ( -hi* )
|
|
&loop ORAk ?&ok POP2 JMP2r ( )
|
|
&ok write-64k INC2 !&loop ( -hi+1* )
|
|
|
|
( writes exactly 65536 bytes )
|
|
@write-64k ( -> ) write-32k ( >> )
|
|
|
|
( writes exactly 32768 bytes )
|
|
@write-32k ( -> ) #8000 ( >> )
|
|
|
|
( write up to 65536 bytes )
|
|
@write-lo ( lo* -> )
|
|
DUP2 #8001 LTH2 ?{ write-32k #8000 SUB2 } LIT2 [ &writer =write-buf ] JMP2
|
|
|
|
( '0' -> 00 )
|
|
( '1' -> 01 )
|
|
( ... )
|
|
( '7' -> 07 )
|
|
( anything else -> 00 )
|
|
@octal-digit ( char^ -> oct^ )
|
|
LIT "0 SUB DUP #08 LTH ?{ POP #00 } JMP2r
|
|
|
|
( returns values between #00:0000:0000 and #01:ffff:ffff )
|
|
( )
|
|
( octal11 of 77777777777 = #01 #ffff #ffff, max value )
|
|
( octal11 of 37777777777 = #00 #ffff #ffff )
|
|
( octal11 of 00000177777 = #00 #0000 #ffff )
|
|
( octal11 of 00000000377 = #00 #0000 #00ff )
|
|
( octal11 of 00000000000 = #00 #0000 #0000, min value )
|
|
@load-octal11 ( addr* -> carry^ hi* lo* )
|
|
INC2k load-octal10 ( addr* hi* lo* ; load addr+1 )
|
|
STH2 STH2 ( addr* [lo* hi*] )
|
|
LDA octal-digit STH2r STH ( octal^ a^ [lo* b^] )
|
|
#20 SFT #02 SFT2 STHr STH2r ( carry^ hi* lo* )
|
|
JMP2r ( carry^ hi* lo* )
|
|
|
|
( returns values between #0000:0000 and #3fff:ffff )
|
|
( )
|
|
( octal10 of 7777777777 = #3fff #ffff, max value )
|
|
( octal10 of 0000177777 = #0000 #ffff )
|
|
( octal10 of 0000000377 = #0000 #00ff )
|
|
( octal10 of 0000000000 = #0000 #0000, min value )
|
|
@load-octal10 ( addr* -> hi* lo* )
|
|
#0005 OVR2 ADD2 ( addr* addr+5* )
|
|
load-octal5 STH2 ( addr* [cd*] )
|
|
load-octal5 SWPr STHr ( ab* c^ [d^] )
|
|
#10 SFT #01 SFT2 STH SWPr ( a^ b>>1^ [lo*] )
|
|
#10 SFT #01 SFT2 STH2r ( hi* lo* )
|
|
JMP2r ( hi* lo* )
|
|
|
|
( returns values between #0000 and #7fff )
|
|
( )
|
|
( octal5 of 77777 = #7fff, max value )
|
|
( octal5 of 00377 = #00ff )
|
|
( octal5 of 00000 = #0000, min value )
|
|
@load-octal5 ( addr* -> num* )
|
|
#1000 LIT2r 0000 ( addr* place* [sum*] )
|
|
&loop ( pos* place* [sum*] )
|
|
OVR2 LDA octal-digit ( addr* place* digit^ [sum*] )
|
|
#00 SWP ( addr* place* digit* [sum*] )
|
|
OVR2 MUL2 STH2 ADD2r ( addr* place* [sum2=sum+place*digit*] )
|
|
SWP2 INC2 SWP2 ( addr+1* place* [sum2*] )
|
|
#03 SFT2 ORAk ?&loop ( addr+1* place>>3* [sum2*] )
|
|
POP2 POP2 STH2r JMP2r ( sum2* )
|
|
|
|
( emit 1, 2, 4, or 5 bytes as a decimal number )
|
|
( @emit
|
|
&1+long STH2 STH2 /byte STH2r STH2r
|
|
&long SWP2 /short
|
|
&short SWP /byte
|
|
&byte DUP #04 SFT /char
|
|
&char #0f AND DUP #09 GTH #27 MUL ADD #30 ADD #18 DEO
|
|
JMP2r )
|
|
|
|
( round a given 5-byte size up to multiples of 512 )
|
|
@round-up-to-512 ( carry^ hi* lo* -> chl^** )
|
|
DUP2 #01ff AND2 ORA ?{ JMP2r }
|
|
DUP2 #fe00 GTH2 ?{ #0200 OVR2 #01ff AND2 SUB2 ADD2 JMP2r }
|
|
POP2 DUP2 #ffff EQU2 ?{ INC2 #0000 JMP2r }
|
|
POP2 INC #0000 #0000 JMP2r
|
|
|
|
( since 4-byte integers are called `long` values, )
|
|
( i'm calling a 5-byte integer a `longer` value. )
|
|
|
|
@dump-longer ( carry^ long** -- )
|
|
STH2 STH2 dump-byte STH2r STH2r ( >> )
|
|
@dump-long ( long** -- )
|
|
SWP2 dump-short ( >> )
|
|
@dump-short ( short* -- )
|
|
SWP dump-byte ( >> )
|
|
@dump-byte ( byte^ -- )
|
|
DUP #04 SFT /hex #0f AND ( >> )
|
|
&hex #30 ADD DUP #39 GTH #27 MUL ADD #18 DEO
|
|
JMP2r
|
|
|
|
@dump-mem ( start* size* -> )
|
|
OVR2 ADD2 SWP2 ( lim* start* )
|
|
LDAk dump-byte INC2 ( lim* start+1* )
|
|
&loop GTH2k ?&ok POP2 POP2 #0a18 DEO JMP2r ( lim^ pos^ )
|
|
&ok #2018 DEO LDAk dump-byte INC2 !&loop ( lim^ pos+1^ )
|
|
|
|
@dump-header ( -> )
|
|
LIT2 "- 18 DEOk DEOk DEOk DEOk DEO #0a18 DEO
|
|
;header/filename #0064 dump-mem
|
|
;header/mode #0008 dump-mem
|
|
;header/owner #0008 dump-mem
|
|
;header/group #0008 dump-mem
|
|
;header/size #000c dump-mem
|
|
;header/mtime #000c dump-mem
|
|
;header/checksum #0008 dump-mem
|
|
;header/type #0001 dump-mem
|
|
;header/linkname #0064 dump-mem
|
|
LIT2 "+ 18 DEOk DEOk DEOk DEOk DEO #0a18 DEO
|
|
;uheader/ustar #0006 dump-mem
|
|
;uheader/version #0002 dump-mem
|
|
;uheader/owner-name #0020 dump-mem
|
|
;uheader/group-name #0020 dump-mem
|
|
;uheader/major #0008 dump-mem
|
|
;uheader/minor #0008 dump-mem
|
|
;uheader/filename-prefix #009b dump-mem
|
|
;uheader/pad #000c dump-mem
|
|
LIT2 "- 18 DEOk DEOk DEOk DEOk DEO #0a18 DEO
|
|
JMP2r
|
|
|
|
( some handy string constants )
|
|
@usage "usage: 20 "uxncli 20 "tar.rom 20 "t|x 20 "FILENAME 0a 00
|
|
@missing-mode "error: 20 "missing 20 "mode 0a 00
|
|
@missing-filename "error: 20 "missing 20 "filename 0a 00
|
|
@too-many-arguments "error: 20 "too 20 "many 20 "arguments 0a 00
|
|
@invalid-mode "error: 20 "invalid 20 "mode 0a 00
|
|
@read-error "error 20 "reading 20 "data 0a 00
|
|
@write-error "error 20 "writing 20 "data 0a 00
|
|
@unsupported "skipped 20 "unsupported 20 "type 20 00
|
|
@meta-too-big "extended 20 "metadata 20 "field 20 "too 20 "big: 20 00
|
|
|
|
( load argument parser )
|
|
~arg.tal
|
|
|
|
( HEADER DETAILS )
|
|
( )
|
|
( header -- basic v7 tar header )
|
|
( /filename - name of file, null-terminated. if ustar, check prefix )
|
|
( /mode - file permissions, ignored by uxn )
|
|
( /owner - owner ID, ignored by uxn )
|
|
( /group - group ID, ignored by uxn )
|
|
( /size - file size as 11 octal digits. max size is 8GiB. )
|
|
( /mtime - last modification time, ignored by uxn )
|
|
( /checksum - 6 octal digits followed by NUL, then space )
|
|
( /type -- only 0, 5, and 7 are supported )
|
|
( '0' [or NUL] normal file )
|
|
( '1' hard link )
|
|
( '2' symlink )
|
|
( '3' character device )
|
|
( '4' block device )
|
|
( '5' directory )
|
|
( '6' fifo )
|
|
( '7' contiguous file -- treat as normal file )
|
|
( 'g' global extended header with metadata; POSIX.1-2001 )
|
|
( 'x' extended header with metadata for next file; POSIX.1-2001 )
|
|
( 'A' solaris ACL )
|
|
( 'D' gnu dump dir )
|
|
( 'E' solaris extended attrs )
|
|
( 'I' inode metadata )
|
|
( 'K' this entry's data is the long link location of next file, null-terminated? )
|
|
( 'L' this entry's data is the long filename of next file, null-terminated )
|
|
( 'M' continuation file )
|
|
( 'N' old gnu for long names )
|
|
( 'S' sparse files )
|
|
( 'V' tape/volume header )
|
|
( 'X' extended attrs, sun )
|
|
( /linkname -- for hardlinks, the file containing the linked data )
|
|
( uheader -- ustar header, found in v7 padding bytes )
|
|
( /ustar -- ustar indiciator, should be "ustar " )
|
|
( /version -- ustar version )
|
|
( /owner-name -- owner name string, ignored by uxn )
|
|
( /group-name -- group name string, ignored by uxn )
|
|
( /major -- major device number, ignored by uxn )
|
|
( /minor -- minor device number, ignored by uxn )
|
|
( /filename-prefix -- if non-null, true path is prefix+"/"+filename )
|
|
( )
|
|
( the v7 header is always 512 bytes even if ustar indicator is absent. )
|
|
|
|
@header
|
|
&filename $64 ( 0x00: filename, string, 100 byte )
|
|
&mode $8 ( 0x64: mode, octal-1, 8 bytes )
|
|
&owner $8 ( 0x6c: owner, octal-1, 8 bytes )
|
|
&group $8 ( 0x74: group, octal-1, 8 bytes )
|
|
&size $c ( 0x7c: size, octal-1, 12 bytes )
|
|
&mtime $c ( 0x88: mtime, octal-1, 12 bytes )
|
|
&checksum $8 ( 0x94: checksum, octal-2, 8 bytes )
|
|
&type $1 ( 0x9c: file type, 1 byte )
|
|
&linkname $64 ( 0x9d: linked filename, string, 100 bytes )
|
|
( >> )
|
|
@uheader
|
|
&ustar $6 ( 0x101: ustar indicator, non-terminated string, 6 bytes, "ustar " )
|
|
&version $2 ( 0x107: ustar version, non-terminated string, 2 bytes )
|
|
&owner-name $20 ( 0x109: owner name, string, 32 bytes )
|
|
&group-name $20 ( 0x129: group name, string, 32 bytes )
|
|
&major $8 ( 0x149: device major number, octal? )
|
|
&minor $8 ( 0x151: device minor number, octal? )
|
|
&filename-prefix $9b ( 0x159: prefix before filename, string, 155 bytes )
|
|
&pad $c ( 0x1f4: padding, 12 bytes )
|
|
&end ( 0x200: end of header )
|
|
|
|
( up to 8 bytes for long size )
|
|
|77f8 @long-size $8
|
|
|
|
( buffer for up to 2048 characters of long names/paths )
|
|
|7800 @long-buf $800
|
|
|
|
( buffer for reading up to 32k bytes of data at a time )
|
|
|8000 @buffer $8000
|