1 ;;;; pathname parsing for Unix filesystems
3 ;;;; This software is part of the SBCL system. See the README file for
;;;; more information.
6 ;;;; This software is derived from the CMU CL system, which was
7 ;;;; written at Carnegie Mellon University and released into the
8 ;;;; public domain. The software is in the public domain and is
9 ;;;; provided with absolutely no warranty. See the COPYING and CREDITS
10 ;;;; files for more information.
12 (in-package "SB!IMPL")
14 ;;; Take a string and return two values. The first is true if the range
15 ;;; starts with a slash (an absolute directory); the second is a list of
;;; (start . end) cons cells marking the slash-separated subsequences.
17 (defun split-at-slashes (namestr start end)
;; NAMESTR is examined between the indices START and END.
;; NOTE(review): several lines of this definition are not visible in
;; this view; the comments below describe only the visible forms.
18 (declare (type simple-string namestr)
19 (type index start end))
;; ABSOLUTE is true when the range is non-empty and its first
;; character is a slash.
20 (let ((absolute (and (/= start end)
21 (char= (schar namestr start) #\/))))
24 ;; Next, split the remainder into slash-separated chunks.
;; Locate the next slash at or after START, within the range.
27 (let ((slash (position #\/ namestr :start start :end end)))
;; Record the chunk as a (start . end) cons; when no slash remains,
;; the chunk runs up to END.
28 (pieces (cons start (or slash end)))
;; Resume scanning just past the slash that ended this chunk.
31 (setf start (1+ slash))))
;; Two values: the absolute flag and the result of (PIECES),
;; presumably the accumulated list of chunks.
32 (values absolute (pieces)))))
34 (defun parse-unix-namestring (namestring start end)
;; Parse the part of NAMESTRING between START and END as a Unix
;; namestring and return its pathname components as multiple values.
;; NOTE(review): some lines of this definition are not visible in this
;; view; the comments describe only the visible forms.
35 (declare (type simple-string namestring)
36 (type index start end))
;; NOTE(review): NAMESTRING is already declared SIMPLE-STRING above, so
;; this coercion looks redundant -- confirm before removing.
37 (setf namestring (coerce namestring 'simple-string))
;; ABSOLUTE flags a leading slash; PIECES is a list of (start . end)
;; index pairs, one per slash-separated chunk.
38 (multiple-value-bind (absolute pieces)
39 (split-at-slashes namestring start end)
40 (multiple-value-bind (name type version)
;; The last chunk, when non-empty, is treated as the file part: it is
;; dropped from PIECES and handed to EXTRACT-NAME-TYPE-AND-VERSION.
41 (let* ((tail (car (last pieces)))
42 (tail-start (car tail))
43 (tail-end (cdr tail)))
44 (unless (= tail-start tail-end)
45 (setf pieces (butlast pieces))
46 (extract-name-type-and-version namestring tail-start tail-end)))
;; Look for a character that may not be embedded in a component; the
;; error message below names #\Nul and #\/.
49 (let ((position (position-if (lambda (char)
50 (or (char= char (code-char 0))
54 (error 'namestring-parse-error
55 :complaint "can't embed #\\Nul or #\\/ in Unix namestring"
56 :namestring namestring
58 ;; Now we have everything we want. So return it.
59 (values nil ; no host for Unix namestrings
60 nil ; no device for Unix namestrings
;; Build the directory component from the remaining chunks, skipping
;; empty ones (where start = end).
62 (dolist (piece pieces)
63 (let ((piece-start (car piece))
64 (piece-end (cdr piece)))
65 (unless (= piece-start piece-end)
66 (cond ((string= namestring ".."
;; A "**" chunk is recorded as :WILD-INFERIORS.
70 ((string= namestring "**"
73 (dirs :wild-inferiors))
;; Otherwise the chunk is passed to MAYBE-MAKE-PATTERN.
75 (dirs (maybe-make-pattern namestring
;; The directory list is headed by :ABSOLUTE or :RELATIVE.
79 (cons :absolute (dirs)))
81 (cons :relative (dirs)))
88 (defun parse-native-unix-namestring (namestring start end as-directory)
;; Parse the part of NAMESTRING between START and END as a native
;; namestring; AS-DIRECTORY influences how the last component is used
;; (see the DIRECTORY binding below).
;; NOTE(review): some lines of this definition are not visible in this
;; view; the comments describe only the visible forms.
89 (declare (type simple-string namestring)
90 (type index start end))
;; NOTE(review): NAMESTRING is already declared SIMPLE-STRING above, so
;; this coercion looks redundant -- confirm before removing.
91 (setf namestring (coerce namestring 'simple-string))
;; RANGES is a list of (start . end) index pairs, one per
;; slash-separated chunk; ABSOLUTE flags a leading slash.
92 (multiple-value-bind (absolute ranges)
93 (split-at-slashes namestring start end)
;; Turn each index pair into a string. A ".." piece that is not the
;; last one (REST is non-empty) gets special treatment.
94 (let* ((components (loop for ((start . end) . rest) on ranges
95 for piece = (subseq namestring start end)
96 collect (if (and (string= piece "..") rest)
;; The directory is chosen depending on AS-DIRECTORY and on whether
;; the last component is non-empty; one alternative drops the last
;; component.
99 (directory (if (and as-directory
100 (string/= "" (car (last components))))
102 (butlast components)))
;; END is rebound here to the last component string; DOT is the
;; position of its last #\. (or NIL).
105 (let* ((end (first (last components)))
106 (dot (position #\. end :from-end t)))
107 ;; FIXME: can we get this dot-interpretation knowledge
108 ;; from existing code? EXTRACT-NAME-TYPE-AND-VERSION
109 ;; does slightly more work than that.
;; Split at the last dot: the text before it and the text after it.
114 (list (subseq end 0 dot) (subseq end (1+ dot))))
;; Returned components: the directory list headed by :ABSOLUTE or
;; :RELATIVE, then the two elements of NAME-AND-TYPE.
119 (cons (if absolute :absolute :relative) directory)
120 (first name-and-type)
121 (second name-and-type)
;;; NOTE(review): /SHOW0 is defined elsewhere; presumably a debugging
;;; trace marker emitted while this file loads -- confirm.
124 (/show0 "filesys.lisp 300")
126 (defun unparse-unix-host (pathname)
;; NOTE(review): the body of this function is not visible in this view.
;; Judging by the comment below, it yields the host designator for
;; PATHNAME -- confirm against the full source.
127 (declare (type pathname pathname)
129 ;; this host designator needs to be recognized as a physical host in
130 ;; PARSE-NAMESTRING. Until sbcl-0.7.3.x, we had "Unix" here, but
131 ;; that's a valid Logical Hostname, so that's a bad choice. -- CSR,
135 (defun unparse-unix-piece (thing)
;; Convert one pathname piece THING back into namestring text.
;; NOTE(review): many lines of this definition are not visible in this
;; view (including the dispatch on the kind of THING); the comments
;; describe only the visible forms.
;; String case: SRCLEN is the length of the source string.
139 (let* ((srclen (length thing))
;; Each source character is inspected individually.
142 (case (schar thing i)
;; The output string is allocated with DSTLEN characters.
145 (let ((result (make-string dstlen))
;; Copy the source characters into RESULT one at a time.
147 (dotimes (src srclen)
148 (let ((char (schar thing src)))
;; A backslash is stored into RESULT here, presumably to escape the
;; character that follows -- confirm against the missing lines.
151 (setf (schar result dst) #\\)
153 (setf (schar result dst) char)
;; Pattern case: walk the pieces of the pattern object.
158 (dolist (piece (pattern-pieces thing))
172 (strings (cdr piece))
;; Anything unrecognized inside a pattern is an error.
175 (error "invalid pattern piece: ~S" piece))))))
180 (defun unparse-unix-directory-list (directory)
;; Convert the directory list DIRECTORY into namestring text.
;; NOTE(review): some lines of this definition are not visible in this
;; view; the comments describe only the visible forms.
181 (declare (type list directory))
;; The head of the list is popped and dispatched on; ECASE signals an
;; error for any head not listed in its clauses.
184 (ecase (pop directory)
;; Process the remaining directory components in order.
190 (dolist (dir directory)
;; :BACK has no namestring representation.
195 (error ":BACK cannot be represented in namestrings."))
196 ((member :wild-inferiors)
;; Strings, patterns and :WILD are rendered by UNPARSE-UNIX-PIECE.
198 ((or simple-string pattern (member :wild))
199 (pieces (unparse-unix-piece dir))
202 (error "invalid directory component: ~S" dir)))))
;; Join the collected fragments into a single simple string.
203 (apply #'concatenate 'simple-string (pieces))))
;;; Render the directory component of PATHNAME as namestring text by
;;; passing its directory list to UNPARSE-UNIX-DIRECTORY-LIST.
(defun unparse-unix-directory (pathname)
  (declare (type pathname pathname))
  (let ((directory-list (%pathname-directory pathname)))
    (unparse-unix-directory-list directory-list)))
209 (defun unparse-unix-file (pathname)
;; Render the name and type components of PATHNAME as namestring text.
;; NOTE(review): some lines of this definition are not visible in this
;; view; the comments describe only the visible forms.
210 (declare (type pathname pathname))
;; TYPE-SUPPLIED is true unless the type is NIL or :UNSPECIFIC.
212 (let* ((name (%pathname-name pathname))
213 (type (%pathname-type pathname))
214 (type-supplied (not (or (null type) (eq type :unspecific)))))
215 ;; Note: by ANSI 19.3.1.1.5, we ignore the version slot when
216 ;; translating logical pathnames to a filesystem without
217 ;; versions (like Unix).
;; With no type, a dot anywhere after the first character of the
;; name is rejected.
219 (when (and (null type)
222 (position #\. name :start 1))
223 (error "too many dots in the name: ~S" pathname))
;; An empty string name is rejected.
224 (when (and (typep name 'string)
226 (error "name is of length 0: ~S" pathname))
227 (strings (unparse-unix-piece name)))
230 (error "cannot specify the type without a file: ~S" pathname))
;; A string type must not itself contain a dot.
231 (when (typep type 'simple-string)
232 (when (position #\. type)
;; NOTE(review): inside a string the reader treats \. as an escaped
;; dot, so this message prints "#." rather than "#\."; other messages
;; in this file write "#\\" for a literal backslash -- confirm and fix.
233 (error "type component can't have a #\. inside: ~S" pathname)))
235 (strings (unparse-unix-piece type))))
;; Join the collected fragments into a single simple string.
236 (apply #'concatenate 'simple-string (strings))))
;;; NOTE(review): /SHOW0 is defined elsewhere; presumably a debugging
;;; trace marker emitted while this file loads -- confirm.
238 (/show0 "filesys.lisp 406")
;;; Produce the namestring text for PATHNAME: the directory text
;;; followed by the file (name and type) text.
(defun unparse-unix-namestring (pathname)
  (declare (type pathname pathname))
  ;; LET* keeps the original evaluation order: directory first, then file.
  (let* ((directory-part (unparse-unix-directory pathname))
         (file-part (unparse-unix-file pathname)))
    (concatenate 'simple-string directory-part file-part)))
246 (defun unparse-native-unix-namestring (pathname as-file)
;; Render PATHNAME as a native namestring, written to a string stream.
;; NOTE(review): some lines of this definition are not visible in this
;; view (including every use of AS-FILE); the comments describe only
;; the visible forms.
247 (declare (type pathname pathname))
;; A component counts as present unless it is NIL or :UNSPECIFIC; an
;; absent component is replaced by the empty string.
248 (let* ((directory (pathname-directory pathname))
249 (name (pathname-name pathname))
250 (name-present-p (typep name '(not (member nil :unspecific))))
251 (name-string (if name-present-p name ""))
252 (type (pathname-type pathname))
253 (type-present-p (typep type '(not (member nil :unspecific))))
254 (type-string (if type-present-p type "")))
;; All output is accumulated in the string stream S.
258 (with-output-to-string (s)
;; An absolute directory starts with a slash.
260 (ecase (car directory)
261 (:absolute (write-char #\/ s))
;; Walk the directory components; SUBDIRS is the remainder of the list
;; after PIECE.
263 (loop for (piece . subdirs) on (cdr directory)
265 ((member :up) (write-string ".." s))
266 (string (write-string piece s))
267 (t (error "ungood directory segment in NATIVE-NAMESTRING: ~S"
;; Emit a separator when more directories follow or the name is a string.
269 if (or subdirs (stringp name))
270 do (write-char #\/ s)
;; A present but non-string name or type (e.g. a wild field) cannot be
;; written out.
276 (unless (stringp name-string) ;some kind of wild field
277 (error "ungood name component in NATIVE-NAMESTRING: ~S" name))
278 (write-string name-string s)
280 (unless (stringp type-string) ;some kind of wild field
281 (error "ungood type component in NATIVE-NAMESTRING: ~S" type))
283 (write-string type-string s)))
284 (when type-present-p ; type without a name
286 "type component without a name component in NATIVE-NAMESTRING: ~S"
290 (defun unparse-unix-enough (pathname defaults)
;; Render PATHNAME as namestring text relative to DEFAULTS where
;; possible.
;; NOTE(review): some lines of this definition are not visible in this
;; view (including the local function LOSE that wraps the error below);
;; the comments describe only the visible forms.
291 (declare (type pathname pathname defaults))
293 (error "~S cannot be represented relative to ~S."
;; PREFIX-LEN is the length of the whole directory list of DEFAULTS,
;; including its leading :ABSOLUTE/:RELATIVE marker.
296 (let* ((pathname-directory (%pathname-directory pathname))
297 (defaults-directory (%pathname-directory defaults))
298 (prefix-len (length defaults-directory))
;; Choose the directory list to print.
300 (cond ((null pathname-directory) '(:relative))
301 ((eq (car pathname-directory) :relative)
;; The directory of PATHNAME is at least as long as that of DEFAULTS
;; and its leading part is compared against it.
303 ((and (> prefix-len 0)
304 (>= (length pathname-directory) prefix-len)
305 (compare-component (subseq pathname-directory
308 ;; Pathname starts with a prefix of default. So
309 ;; just use a relative directory from then on out.
310 (cons :relative (nthcdr prefix-len pathname-directory)))
311 ((eq (car pathname-directory) :absolute)
312 ;; We are an absolute pathname, so we can just use it.
315 (bug "Bad fallthrough in ~S" 'unparse-unix-enough)))))
316 (strings (unparse-unix-directory-list result-directory)))
;; The type is needed when it is neither NIL nor :UNSPECIFIC; the name
;; is needed when the type is, or when the name comparison fails.
317 (let* ((pathname-type (%pathname-type pathname))
318 (type-needed (and pathname-type
319 (not (eq pathname-type :unspecific))))
320 (pathname-name (%pathname-name pathname))
321 (name-needed (or type-needed
323 (not (compare-component pathname-name
327 (unless pathname-name (lose))
;; With no type, a dot anywhere after the first character of a string
;; name is rejected.
328 (when (and (null pathname-type)
329 (typep pathname-name 'simple-string)
330 (position #\. pathname-name :start 1))
331 (error "too many dots in the name: ~S" pathname))
332 (strings (unparse-unix-piece pathname-name)))
334 (when (or (null pathname-type) (eq pathname-type :unspecific))
;; A string type must not itself contain a dot.
336 (when (typep pathname-type 'simple-string)
337 (when (position #\. pathname-type)
;; NOTE(review): inside a string the reader treats \. as an escaped
;; dot, so this message prints "#." rather than "#\."; other messages
;; in this file write "#\\" for a literal backslash -- confirm and fix.
338 (error "type component can't have a #\. inside: ~S" pathname)))
340 (strings (unparse-unix-piece pathname-type))))
;; Join the collected fragments into a single simple string.
341 (apply #'concatenate 'simple-string (strings)))))
343 (defun simplify-unix-namestring (src)
;; Build a simplified copy of the namestring SRC, handling "." and ".."
;; segments between slashes as described by the comments below.
;; NOTE(review): many lines of this definition are not visible in this
;; view; the comments describe only the visible forms.
344 (declare (type simple-string src))
;; DST is a scratch string as long as SRC; DST-LEN counts how much of
;; it is in use.
345 (let* ((src-len (length src))
346 (dst (make-string src-len :element-type 'character))
;; DEPOSIT stores a character into DST at index DST-LEN.
350 (macrolet ((deposit (char)
352 (setf (schar dst dst-len) ,char)
;; Scan SRC one character at a time.
354 (dotimes (src-index src-len)
355 (let ((char (schar src src-index)))
356 (cond ((char= char #\.)
363 ;; either ``/...' or ``...//...'
;; LAST-SLASH is set to the current output length.
365 (setf last-slash dst-len)
368 ;; either ``./...'' or ``..././...''
373 ((and last-slash (not (zerop last-slash)))
374 ;; There is something before this ..
;; Find the slash preceding the previous segment in DST.
375 (let ((prev-prev-slash
376 (position #\/ dst :end last-slash :from-end t)))
;; Check whether the two characters before LAST-SLASH are both dots.
377 (cond ((and (= (+ (or prev-prev-slash 0) 2)
379 (char= (schar dst (- last-slash 2)) #\.)
380 (char= (schar dst (1- last-slash)) #\.))
381 ;; The something before this .. is another ..
383 (setf last-slash dst-len))
385 ;; The something is some directory or other.
390 (setf last-slash prev-prev-slash)))))
392 ;; There is nothing before this .., so we need to keep it
393 (setf last-slash dst-len)
396 ;; something other than a dot between slashes
397 (setf last-slash dst-len)
;; Store the current character directly into DST.
402 (setf (schar dst dst-len) char)
;; After the scan: handle a trailing "." or ".." segment.
404 (when (and last-slash (not (zerop last-slash)))
407 ;; We've got ``foobar/.''
410 ;; We've got ``foobar/..''
;; Skip this step when the segment before LAST-SLASH is itself "..".
411 (unless (and (>= last-slash 2)
412 (char= (schar dst (1- last-slash)) #\.)
413 (char= (schar dst (- last-slash 2)) #\.)
415 (char= (schar dst (- last-slash 3)) #\/)))
416 (let ((prev-prev-slash
417 (position #\/ dst :end last-slash :from-end t)))
;; Truncate the output to just after that earlier slash.
419 (setf dst-len (1+ prev-prev-slash))
;; Otherwise return "./" immediately.
420 (return-from simplify-unix-namestring
421 (coerce "./" 'simple-string))))))))
;; An empty result is handled specially (branch body not visible here);
;; otherwise the used prefix of DST is returned.
422 (cond ((zerop dst-len)
427 (subseq dst 0 dst-len)))))