forked from ruricolist/serapeum
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfiles.lisp
300 lines (253 loc) · 11.4 KB
/
files.lisp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
(in-package :serapeum)
;;; Pathname types. These correspond to the predicates defined by
;;; UIOP.
(deftype wild-pathname ()
"A pathname with wild components."
'(and pathname (satisfies wild-pathname-p)))
(deftype non-wild-pathname ()
"A pathname without wild components."
'(or directory-pathname
(and pathname (not (satisfies wild-pathname-p)))))
(deftype absolute-pathname ()
'(and pathname (satisfies uiop:absolute-pathname-p)))
(deftype relative-pathname ()
'(and pathname (satisfies uiop:relative-pathname-p)))
(deftype directory-pathname ()
'(and pathname (satisfies uiop:directory-pathname-p)))
(deftype absolute-directory-pathname ()
'(and absolute-pathname directory-pathname))
(deftype file-pathname ()
'(and pathname (satisfies uiop:file-pathname-p)))
;;; logical-pathname is defined in CL.
(deftype physical-pathname ()
'(and pathname (not (satisfies logical-pathname-p))))
(defmacro with-open-files ((&rest args) &body body)
"A simple macro to open one or more files providing the streams for the BODY. The ARGS is a list of `(stream filespec options*)` as supplied to WITH-OPEN-FILE."
(case (length args)
((0)
`(progn ,@body))
((1)
`(with-open-file ,(first args) ,@body))
(t `(with-open-file ,(first args)
(with-open-files
,(rest args) ,@body)))))
(defun path-basename (pathname)
"Return the basename, that is:
- if it's a directory, the name of the directory,
- if it's a file, the name of the file including its type (extension)."
(first (last (pathname-directory (uiop:ensure-directory-pathname pathname)))))
(-> path-join (&rest (or string stream pathname))
(values pathname &optional))
(defun path-join (&rest pathnames)
"Build a pathname by merging from right to left.
With `path-join' you can pass the elements of the pathname being built
in the order they appear in it:
(path-join (user-homedir-pathname) config-dir config-file)
≡ (uiop:merge-pathnames* config-file
(uiop:merge-pathnames* config-dir
(user-homedir-pathname)))
Note that `path-join' does not coerce the parts of the pathname into
directories; you have to do that yourself.
(path-join \"dir1\" \"dir2\" \"file\") -> #p\"file\"
(path-join \"dir1/\" \"dir2/\" \"file\") -> #p\"dir1/dir2/file\"
Cf. `base-path-join' for a similar function with more intuitive
behavior."
(the pathname
(reduce (lambda (x y)
(uiop:merge-pathnames* y x))
pathnames
:initial-value (make-pathname))))
(-> base-path-join ((or string stream pathname) &rest (or string stream pathname))
(values pathname &optional))
(defun base-path-join (base &rest suffixes)
"Build a pathname by appending SUFFIXES to BASE.
For `path-join-base', the path on the left is always the *base* and
the path on the right is always the *suffix*. This means that even if
the right hand path is absolute, it will be treated as if it were
relative.
(base-path-join #p\"foo/bar\" #p\"/baz\")
=> #p\"foo/bar/baz\")
Also, a bare file name as a suffix does not override but is appended
to the accumulated file name. This includes the extension.
(base-path-join #p\"foo/bar\" \"baz\")
=> #p\"foo/barbaz\")
(base-path-join #p\"foo/bar.x\" \"baz.y\")
=> #p\"foo/bar.xbaz.y\")
See `path-join' for a similar function with more consistent behavior."
;; Contributed by Pierre Niedhardt (@ambrevar).
;; https://github.com/ruricolist/serapeum/issues/127
(if (null suffixes)
(the (values pathname &optional)
(uiop:ensure-pathname base))
(reduce (lambda (path1 path2)
(if (or (null (pathname-name path1))
(pathname-directory path2))
(uiop:merge-pathnames*
(uiop:relativize-pathname-directory
(uiop:ensure-pathname path2))
(uiop:ensure-pathname path1 :ensure-directory t))
(let ((new-base (string+ (path-basename path1)
(path-basename path2))))
(make-pathname :defaults path1
:type (pathname-type new-base)
:name (pathname-name new-base)))))
suffixes
:initial-value base)))
(defun write-stream-into-file (stream pathname &key (if-exists :error) if-does-not-exist)
"Read STREAM and write the contents into PATHNAME.
STREAM will be closed afterwards, so wrap it with
`make-concatenated-stream' if you want it left open."
(check-type pathname pathname)
(with-open-stream (in stream)
(with-output-to-file (out pathname
:element-type (stream-element-type in)
:if-exists if-exists
:if-does-not-exist if-does-not-exist)
(copy-stream in out)))
pathname)
(defun write-file-into-stream (pathname output &key (if-does-not-exist :error)
(external-format :default))
"Write the contents of FILE into STREAM."
(check-type pathname pathname)
(with-input-from-file (input pathname
:element-type (stream-element-type output)
:if-does-not-exist if-does-not-exist
:external-format external-format)
(copy-stream input output)))
(defun file= (file1 file2 &key (buffer-size 4096))
"Compare FILE1 and FILE2 octet by octet, \(possibly) using buffers
of BUFFER-SIZE."
(declare (ignorable buffer-size))
(let ((file1 (truename file1))
(file2 (truename file2)))
(or (equal file1 file2)
(and (= (file-size-in-octets file1)
(file-size-in-octets file2))
#+ccl (file=/mmap file1 file2)
#-ccl (file=/loop file1 file2 :buffer-size buffer-size)))))
#+ccl
(defun file=/mmap (file1 file2)
"Compare FILE1 and FILE2 by memory-mapping them and comparing them
as vectors."
(macrolet ((with-mmap ((var file) &body body)
`(let* ((,var (ccl:map-file-to-octet-vector ,file)))
(unwind-protect
(progn ,@body)
(ccl:unmap-ivector ,var)))))
(with-mmap (vec1 file1)
(with-mmap (vec2 file2)
;; The vector returned when CCL memory maps a file is a
;; displaced vector, because of alignment issues. But
;; `octet-vector=' takes a `:start' parameter, so we can
;; directly compare the underlying simple vectors.
(multiple-value-bind (vec1 start1)
(array-displacement vec1)
(multiple-value-bind (vec2 start2)
(array-displacement vec2)
(octet-vector= vec1 vec2
:start1 start1
:start2 start2)))))))
(defun file=/loop (file1 file2 &key (buffer-size 4096))
"Compare two files by looping over their contents using a buffer."
(declare
(type pathname file1 file2)
(type array-length buffer-size)
(optimize (safety 1) (debug 0) (compilation-speed 0)))
(flet ((make-buffer ()
(make-array buffer-size
:element-type 'octet
:initial-element 0)))
(declare (inline make-buffer))
(with-open-files ((file1 file1 :element-type 'octet :direction :input)
(file2 file2 :element-type 'octet :direction :input))
(and (= (file-length file1)
(file-length file2))
(locally (declare (optimize speed))
(loop with buffer1 = (make-buffer)
with buffer2 = (make-buffer)
for end1 = (read-sequence buffer1 file1)
for end2 = (read-sequence buffer2 file2)
until (or (zerop end1) (zerop end2))
always (and (= end1 end2)
(octet-vector= buffer1 buffer2
:end1 end1
:end2 end2))))))))
(defun file-size (file &key (element-type '(unsigned-byte 8)))
"The size of FILE, in units of ELEMENT-TYPE (defaults to bytes).
The size is computed by opening the file and getting the length of the
resulting stream.
If all you want is to read the file's size in octets from its
metadata, consider `trivial-file-size:file-size-in-octets' instead."
(check-type file (or string pathname))
(with-input-from-file (in file :element-type element-type)
(file-length in)))
(defconstant +pathsep+
(if (uiop:os-windows-p) #\; #\:)
"Path separator for this OS.")
(defun exe (p)
"If P, a pathname designator, has no extension, then, on Windows
only, add an extension of `.exe`."
(let* ((p (pathname p))
(type (pathname-type p)))
(if (and (uiop:os-windows-p)
(null type))
(make-pathname :type "exe"
:defaults p)
p)))
(defun $path ()
"Split the PATH environment variable."
(mapcar #'uiop:ensure-directory-pathname
;; This is enough; Neither Windows nor POSIX support
;; escaping the separator in $PATH.
(split-sequence +pathsep+
(uiop:getenv "PATH")
:remove-empty-subseqs t)))
(defun resolve-executable (p)
"Look for an executable using the PATH environment variable.
P is a pathname designator.
On Windows only, if P does not have an extension, it assumed to end in
`.exe`.
Note that this function does not check the current directory (even on
Windows) and it does not care if P is already an absolute pathname: it
only cares about its name and type."
(let* ((p (exe p))
(name (pathname-name p))
(type (pathname-type p)))
(loop for dir in ($path)
for pathname = (make-pathname :name name
:type type
:defaults dir)
when (uiop:file-exists-p pathname)
do (return pathname))))
(defun format-file-size-human-readable (stream file-size
&key flavor
(space (eql flavor :si))
(suffix (if (eql flavor :iec) "B" "")))
"Write FILE-SIZE, a file size in bytes, to STREAM, in human-readable form.
STREAM is interpreted as by `format'.
If FLAVOR is nil, kilobytes are 1024 bytes and SI prefixes are used.
If FLAVOR is `:si', kilobytes are 1000 bytes and SI prefixes are used.
If FLAVOR is `:iec', kilobytes are 1024 bytes and IEC prefixes (Ki,
Mi, etc.) are used.
If SPACE is non-nil, include a space between the number and the
prefix. (Defaults to T if FLAVOR is `:si'.)
SUFFIX is the suffix to use; defaults to B if FLAVOR is `:iec',
otherwise empty."
(check-type file-size (integer 0 *))
(if (zerop file-size)
(format stream "0")
(let ((flavor (if (null flavor) :file flavor)))
(multiple-value-bind (formatter args)
(human-size-formatter file-size :flavor flavor :space space)
(format stream "~?~a" formatter args suffix)))))
(defun file-size-human-readable (file &key flavor space suffix stream)
"Format the size of FILE (in octets) using `format-file-size-human-readable'.
The size of file is found by `trivial-file-size:file-size-in-octets'.
Inspired by the function of the same name in Emacs."
(let ((file-size (file-size-in-octets file)))
(format-file-size-human-readable
stream
file-size
:flavor flavor
:suffix suffix
:space space)))