2 * Copyright (c) 1983, 1993
3 * The Regents of the University of California. All rights reserved.
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
8 * 1. Redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution.
13 * 4. Neither the name of the University nor the names of its contributors
14 * may be used to endorse or promote products derived from this software
15 * without specific prior written permission.
17 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30 #if defined(LIBC_SCCS) && !defined(lint)
31 static char sccsid
[] = "@(#)opendir.c 8.8 (Berkeley) 5/1/95";
32 #endif /* LIBC_SCCS and not lint */
33 #include <sys/cdefs.h>
34 __FBSDID("$FreeBSD$");
36 #include "namespace.h"
37 #include <sys/param.h>
38 #include <sys/mount.h>
40 #include <sys/sysctl.h>
49 #include "un-namespace.h"
54 __kernel_supports_unionfs(void)
56 static int8_t kernel_supports_unionfs
= -1;
57 if (kernel_supports_unionfs
== -1) {
59 size_t len
= sizeof(value
);
60 sysctlbyname("kern.secure_kernel", &value
, &len
, NULL
, 0);
61 kernel_supports_unionfs
= !value
;
63 return kernel_supports_unionfs
;
67 __fd_is_on_union_mount(int fd
)
72 rc
= fstatfs(fd
, &stbuf
);
76 return (stbuf
.f_flags
& MNT_UNION
) != 0;
79 static DIR * __opendir_common(int, int, bool);
85 opendir(const char *name
)
88 return (__opendir2(name
, DTF_HIDEW
|DTF_NODUP
));
92 * Open a directory with existing file descriptor.
99 /* Check that fd is associated with a directory. */
100 if (_fstat(fd
, &statb
) != 0)
102 if (!S_ISDIR(statb
.st_mode
)) {
106 /* Make sure CLOEXEC is set on the fd */
107 if (_fcntl(fd
, F_SETFD
, FD_CLOEXEC
) == -1)
109 return (__opendir_common(fd
, DTF_HIDEW
|DTF_NODUP
, true));
113 __opendir2(const char *name
, int flags
)
119 if ((flags
& (__DTF_READALL
| __DTF_SKIPREAD
)) != 0)
121 if ((fd
= _open(name
,
122 O_RDONLY
| O_NONBLOCK
| O_DIRECTORY
| O_CLOEXEC
)) == -1)
125 dir
= __opendir_common(fd
, flags
, false);
135 opendir_compar(const void *p1
, const void *p2
)
138 return (strcmp((*(const struct dirent
**)p1
)->d_name
,
139 (*(const struct dirent
**)p2
)->d_name
));
143 * For a directory at the top of a unionfs stack, the entire directory's
144 * contents are read and cached locally until the next call to rewinddir().
145 * For the fdopendir() case, the initial seek position must be preserved.
146 * For rewinddir(), the full directory should always be re-read from the
149 * If an error occurs, the existing buffer and state of 'dirp' is left
153 _filldir(DIR *dirp
, bool use_current_pos
)
156 char *buf
, *ddptr
, *ddeptr
;
158 int fd2
, incr
, len
, n
, saved_errno
, space
;
166 * Use the system page size if that is a multiple of DIRBLKSIZ.
167 * Hopefully this can be a big win someday by allowing page
168 * trades to user space to be done by _getdirentries().
170 incr
= getpagesize();
171 if ((incr
% DIRBLKSIZ
) != 0)
175 * The strategy here is to read all the directory
176 * entries into a buffer, sort the buffer, and
177 * remove duplicate entries by setting the inode
180 * We reopen the directory because _getdirentries()
181 * on a MNT_UNION mount modifies the open directory,
182 * making it refer to the lower directory after the
183 * upper directory's entries are exhausted.
184 * This would otherwise break software that uses
185 * the directory descriptor for fchdir or *at
186 * functions, such as fts.c.
188 if ((fd2
= openat(dirp
->dd_fd
, ".", O_RDONLY
| O_CLOEXEC
)) == -1)
191 if (use_current_pos
) {
192 pos
= lseek(dirp
->dd_fd
, 0, SEEK_CUR
);
193 if (pos
== -1 || lseek(fd2
, pos
, SEEK_SET
) == -1) {
203 * Always make at least DIRBLKSIZ bytes
204 * available to _getdirentries
206 if (space
< DIRBLKSIZ
) {
209 buf
= reallocf(buf
, len
);
216 ddptr
= buf
+ (len
- space
);
219 #if __DARWIN_64_BIT_INO_T
220 n
= (int)__getdirentries64(fd2
, ddptr
, space
, &dirp
->dd_td
->seekoff
);
221 #else /* !__DARWIN_64_BIT_INO_T */
222 n
= _getdirentries(fd2
, ddptr
, space
, &dirp
->dd_seek
);
223 #endif /* __DARWIN_64_BIT_INO_T */
240 * There is now a buffer full of (possibly) duplicate
246 * Go round this loop twice...
248 * Scan through the buffer, counting entries.
249 * On the second pass, save pointers to each one.
250 * Then sort the pointers and remove duplicate names.
255 while (ddptr
< ddeptr
) {
258 dp
= (struct dirent
*) ddptr
;
261 if ((dp
->d_reclen
<= 0) ||
262 (dp
->d_reclen
> (ddeptr
+ 1 - ddptr
)))
264 ddptr
+= dp
->d_reclen
;
276 * This sort must be stable.
278 mergesort(dpv
, n
, sizeof(*dpv
), opendir_compar
);
284 * Scan through the buffer in sort order,
285 * zapping the inode number of any
288 for (n
= 0; dpv
[n
]; n
++) {
289 struct dirent
*dp
= dpv
[n
];
292 strcmp(dp
->d_name
, xp
->d_name
)) {
297 if (dp
->d_type
== DT_WHT
&&
298 (dirp
->dd_flags
& DTF_HIDEW
))
305 dpv
= malloc((n
+1) * sizeof(struct dirent
*));
312 dirp
->dd_size
= ddptr
- dirp
->dd_buf
;
318 * Common routine for opendir(3), __opendir2(3) and fdopendir(3).
321 __opendir_common(int fd
, int flags
, bool use_current_pos
)
327 if ((dirp
= malloc(sizeof(DIR) + sizeof(struct _telldir
))) == NULL
)
332 dirp
->dd_flags
= flags
;
334 dirp
->dd_lock
= (pthread_mutex_t
)PTHREAD_MUTEX_INITIALIZER
;
335 dirp
->dd_td
= (struct _telldir
*)((char *)dirp
+ sizeof(DIR));
336 LIST_INIT(&dirp
->dd_td
->td_locq
);
337 dirp
->dd_td
->td_loccnt
= 0;
340 * Determine whether this directory is the top of a union stack.
342 if ((flags
& DTF_NODUP
) && __kernel_supports_unionfs()) {
343 unionstack
= __fd_is_on_union_mount(fd
);
351 if (!_filldir(dirp
, use_current_pos
))
353 dirp
->dd_flags
|= __DTF_READALL
;
356 * Start with a small-ish size to avoid allocating full pages.
357 * readdir() will allocate a larger buffer if it didn't fit
358 * to stay fast for large directories.
360 _Static_assert(GETDIRENTRIES64_EXTENDED_BUFSIZE
<= READDIR_INITIAL_SIZE
,
361 "Make sure we'll get extended metadata");
362 dirp
->dd_len
= READDIR_INITIAL_SIZE
;
363 dirp
->dd_buf
= malloc(dirp
->dd_len
);
364 if (dirp
->dd_buf
== NULL
)
366 if (use_current_pos
) {
368 * Read the first batch of directory entries
369 * to prime dd_seek. This also checks if the
370 * fd passed to fdopendir() is a directory.
372 #if __DARWIN_64_BIT_INO_T
374 * sufficiently recent kernels when the buffer is large enough,
375 * will use the last bytes of the buffer to return status.
377 * To support older kernels:
378 * - make sure it's 0 initialized
379 * - make sure it's past `dd_size` before reading it
381 getdirentries64_flags_t
*gdeflags
=
382 (getdirentries64_flags_t
*)(dirp
->dd_buf
+ dirp
->dd_len
-
383 sizeof(getdirentries64_flags_t
));
385 dirp
->dd_size
= (long)__getdirentries64(dirp
->dd_fd
,
386 dirp
->dd_buf
, dirp
->dd_len
, &dirp
->dd_td
->seekoff
);
387 if (dirp
->dd_size
>= 0 &&
388 dirp
->dd_size
<= dirp
->dd_len
- sizeof(getdirentries64_flags_t
)) {
389 if (*gdeflags
& GETDIRENTRIES64_EOF
) {
390 dirp
->dd_flags
|= __DTF_ATEND
;
393 #else /* !__DARWIN_64_BIT_INO_T */
394 dirp
->dd_size
= _getdirentries(dirp
->dd_fd
,
395 dirp
->dd_buf
, dirp
->dd_len
, &dirp
->dd_seek
);
396 #endif /* __DARWIN_64_BIT_INO_T */
397 if (dirp
->dd_size
< 0) {
402 dirp
->dd_flags
|= __DTF_SKIPREAD
;
405 #if __DARWIN_64_BIT_INO_T
406 dirp
->dd_td
->seekoff
= 0;
407 #else /* !__DARWIN_64_BIT_INO_T */
409 #endif /* __DARWIN_64_BIT_INO_T */