1 ! Copyright (C) 2009 Doug Coleman.
2 ! See http://factorcode.org/license.txt for BSD license.
3 USING: accessors byte-arrays combinators io io.backend
4 io.directories io.encodings.binary io.files io.files.links
5 io.pathnames io.streams.byte-array io.streams.string kernel
6 math math.parser namespaces sequences strings summary
! Value checksum-header yields for a block whose bytes are all zero
! (both partial sums are 0 and it always adds 256). parse-tar-header
! compares the computed checksum against this constant.
10 CONSTANT: zero-checksum 256
! Number of bytes requested per read of the archive stream; also the
! amount by which read-data-blocks reduces the header's remaining size.
11 CONSTANT: block-size 512
15 : save-link ( link -- )
! One parsed tar header. read-tar-header fills the slots with the
! >>slot setters; mode, uid, gid, size, mtime, checksum, devmajor and
! devminor are stored as the result of oct>, the remaining visible
! fields as strings.
18 TUPLE: tar-header name mode uid gid size mtime checksum typeflag
19 linkname magic version uname gname devmajor devminor prefix ;
! Error class with a single slot, header. parse-tar-header throws it
! when its checksum equality test fails.
21 ERROR: checksum-error header ;
! Strip NUL characters and spaces from BOTH ends of seq.
! Numeric tar fields can be padded on either side (some writers
! left-pad with spaces), and oct> yields f for a string that still
! carries padding, so trimming only the tail would lose the value.
23 : trim-string ( seq -- newseq ) [ "\0 " member? ] trim ;
! Read n elements from the current input stream, drop the trailing
! zero elements, and convert what is left to a string ("" like).
! NOTE(review): behaviour when read returns fewer than n elements (or
! f at end of stream) is not handled here — confirm callers guarantee
! a full header block.
25 : read-c-string ( n -- str )
26 read [ zero? ] trim-tail "" like ;
28 : read-tar-header ( -- header )
30 100 read-c-string >>name
31 8 read-c-string trim-string oct> >>mode
32 8 read-c-string trim-string oct> >>uid
33 8 read-c-string trim-string oct> >>gid
34 12 read-c-string trim-string oct> >>size
35 12 read-c-string trim-string oct> >>mtime
36 8 read-c-string trim-string oct> >>checksum
38 100 read-c-string >>linkname
41 32 read-c-string >>uname
42 32 read-c-string >>gname
43 8 read trim-string oct> >>devmajor
44 8 read trim-string oct> >>devminor
45 155 read-c-string >>prefix ;
! Compute the checksum of a raw header block given as a byte-array.
! seq is split at index 148, the first 8 elements of the remainder are
! skipped, both pieces are summed, and 256 is added to the total
! before the result is converted to a fixnum.
! NOTE(review): the 8 skipped bytes line up with the checksum field
! read by read-tar-header (100+8+8+8+12+12 = 148), and 256 = 8 * 32,
! presumably counting that field as eight spaces — confirm against
! the tar format specification.
47 TYPED: checksum-header ( seq: byte-array -- n )
48 148 cut-slice 8 tail-slice [ 0 [ + ] reduce ] bi@ + 256 + >fixnum ;
50 : read-data-blocks ( header -- )
53 over size>> dup block-size <= [
57 [ block-size - ] change-size
65 ] if ; inline recursive
67 : parse-tar-header ( seq -- header )
68 dup checksum-header dup zero-checksum = [
75 binary [ read-tar-header ] with-byte-reader
77 ] dip = [ checksum-error ] unless
! Error class with a single slot, ch. It is thrown by the typeflag-N
! words for entry types this vocabulary does not implement.
80 ERROR: unknown-typeflag ch ;
! Human-readable description of the error: the fixed message followed
! by the offending typeflag character.
! suffix adds ch at the END of the message; prefix would have put the
! character in front of "Unknown typeflag: ".
82 M: unknown-typeflag summary
83 ch>> [ "Unknown typeflag: " ] dip suffix ;
! Open path as a binary file writer and run read-data-blocks on header
! inside it, so everything read-data-blocks writes goes to that file.
85 : read/write-blocks ( header path -- )
86 binary [ read-data-blocks ] with-file-writer ;
! Handler dispatched for typeflag CHAR: 0: writes the entry's data to
! a file whose path is the header's name slot.
! NOTE(review): name is used as the output path unmodified — confirm
! that archive member names are trusted or sanitised by the caller.
89 : typeflag-0 ( header -- )
90 dup name>> read/write-blocks ;
! Record describing a hard link to create: linkname and name are
! copied from a tar header by typeflag-1.
! <hard-link> is the by-order-of-arguments constructor
! ( linkname name -- hard-link ).
92 TUPLE: hard-link linkname name ;
93 C: <hard-link> hard-link
! Record describing a symbolic link to create: linkname and name are
! copied from a tar header by typeflag-2.
! <symbolic-link> is the by-order-of-arguments constructor
! ( linkname name -- symbolic-link ).
95 TUPLE: symbolic-link linkname name ;
96 C: <symbolic-link> symbolic-link
98 ! Hard link, don't call normalize-path
! Builds a hard-link record from the header's linkname and name slots
! and passes it to save-link; the link is not created here.
99 : typeflag-1 ( header -- )
100 [ linkname>> ] [ name>> ] bi <hard-link> save-link ;
102 ! Symlink, don't call normalize-path
! Builds a symbolic-link record from the header's linkname and name
! slots and passes it to save-link; the link is not created here.
103 : typeflag-2 ( header -- )
104 [ linkname>> ] [ name>> ] bi <symbolic-link> save-link ;
! Unsupported entry type (CHAR: 3). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
107 : typeflag-3 ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: 4). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
110 : typeflag-4 ( header -- ) typeflag>> unknown-typeflag ;
! Handler dispatched for typeflag CHAR: 5: passes the header's name
! to make-directories.
113 : typeflag-5 ( header -- )
114 name>> make-directories ;
! Unsupported entry type (CHAR: 6). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
117 : typeflag-6 ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: 7). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
120 : typeflag-7 ( header -- ) typeflag>> unknown-typeflag ;
122 ! Global extended header
! Unsupported entry type. Throws unknown-typeflag carrying the
! header's typeflag: the error's ch slot is combined with a string by
! its summary method, so it must hold the flag, not the header.
123 : typeflag-8 ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: 9). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
126 : typeflag-9 ( header -- ) typeflag>> unknown-typeflag ;
128 ! Global POSIX header
! Runs read-data-blocks with output captured by a string writer and
! drops the resulting string, so the entry's data is consumed from the
! input without being stored anywhere.
129 : typeflag-g ( header -- )
130 ! Read something like: 52 comment=9f2a940965286754f3a34d5737c3097c05db8725
132 [ read-data-blocks ] with-string-writer drop ;
134 ! Extended POSIX header
! Unsupported entry type. Throws unknown-typeflag carrying the
! header's typeflag: the error's ch slot is combined with a string by
! its summary method, so it must hold the flag, not the header.
135 : typeflag-x ( header -- ) typeflag>> unknown-typeflag ;
137 ! Solaris access control list
! Unsupported entry type. Throws unknown-typeflag carrying the
! header's typeflag: the error's ch slot is combined with a string by
! its summary method, so it must hold the flag, not the header.
138 : typeflag-A ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: D). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
141 : typeflag-D ( header -- ) typeflag>> unknown-typeflag ;
143 ! Solaris extended attribute file
! Unsupported entry type. Throws unknown-typeflag carrying the
! header's typeflag: the error's ch slot is combined with a string by
! its summary method, so it must hold the flag, not the header.
144 : typeflag-E ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: I). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
147 : typeflag-I ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: K). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
150 : typeflag-K ( header -- ) typeflag>> unknown-typeflag ;
153 : typeflag-L ( header -- )
156 ! [ read-data-blocks ] with-string-writer
157 ! [ zero? ] trim-tail filename set
158 ! filename get make-directories ;
160 ! Multi volume continuation entry
! Unsupported entry type. Throws unknown-typeflag carrying the
! header's typeflag: the error's ch slot is combined with a string by
! its summary method, so it must hold the flag, not the header.
161 : typeflag-M ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: N). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
164 : typeflag-N ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: S). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
167 : typeflag-S ( header -- ) typeflag>> unknown-typeflag ;
! Unsupported entry type (CHAR: V). Throws unknown-typeflag carrying
! the header's typeflag: the error's ch slot is combined with a string
! by its summary method, so it must hold the flag, not the header.
170 : typeflag-V ( header -- ) typeflag>> unknown-typeflag ;
172 ! Vendor extended header type
! Unsupported entry type. Throws unknown-typeflag carrying the
! header's typeflag: the error's ch slot is combined with a string by
! its summary method, so it must hold the flag, not the header.
173 : typeflag-X ( header -- ) typeflag>> unknown-typeflag ;
176 block-size read dup length block-size = [
181 { CHAR: 0 [ typeflag-0 ] }
182 ! { CHAR: 1 [ typeflag-1 ] }
183 { CHAR: 2 [ typeflag-2 ] }
184 ! { CHAR: 3 [ typeflag-3 ] }
185 ! { CHAR: 4 [ typeflag-4 ] }
186 { CHAR: 5 [ typeflag-5 ] }
187 ! { CHAR: 6 [ typeflag-6 ] }
188 ! { CHAR: 7 [ typeflag-7 ] }
189 { CHAR: g [ typeflag-g ] }
190 ! { CHAR: x [ typeflag-x ] }
191 ! { CHAR: A [ typeflag-A ] }
192 ! { CHAR: D [ typeflag-D ] }
193 ! { CHAR: E [ typeflag-E ] }
194 ! { CHAR: I [ typeflag-I ] }
195 ! { CHAR: K [ typeflag-K ] }
196 { CHAR: L [ typeflag-L ] }
197 ! { CHAR: M [ typeflag-M ] }
198 ! { CHAR: N [ typeflag-N ] }
199 ! { CHAR: S [ typeflag-S ] }
200 ! { CHAR: V [ typeflag-V ] }
201 ! { CHAR: X [ typeflag-X ] }
! Generic word that creates the link described by object. Methods are
! supplied per link record class (for example symbolic-link).
208 GENERIC: do-link ( object -- )
211 [ linkname>> ] [ name>> ] bi make-hard-link ;
! Create the symbolic link with make-link, passing the record's
! linkname first and its name second.
213 M: symbolic-link do-link
214 [ linkname>> ] [ name>> ] bi make-link ;
216 ! FIXME: linux tar calls unlinkat and makelinkat
219 [ name>> ?delete-file ] [ do-link ] bi
223 normalize-path dup parent-directory [
225 binary [ parse-tar ] with-file-reader