123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276 |
- /*
- * 9p utilities
- *
- * Copyright IBM, Corp. 2017
- *
- * Authors:
- * Greg Kurz <groug@kaod.org>
- *
- * This work is licensed under the terms of the GNU GPL, version 2 or later.
- * See the COPYING file in the top-level directory.
- */
- #ifndef QEMU_9P_UTIL_H
- #define QEMU_9P_UTIL_H
- #include "qemu/error-report.h"
/*
 * O_PATH_9P_UTIL is O_PATH on hosts that define it and 0 everywhere else,
 * so it can be OR-ed into (or tested against) open flags unconditionally.
 */
#ifndef O_PATH
#define O_PATH_9P_UTIL 0
#else
#define O_PATH_9P_UTIL O_PATH
#endif
#if !defined(CONFIG_LINUX)
/*
 * Builds a Linux device number (a.k.a. dev_t) out of separate device major
 * and minor numbers.
 *
 * Strictly speaking the result is in glibc's 64-bit format
 * (MMMM_Mmmm_mmmM_MMmm), which is compatible with Linux's 32-bit format
 * (mmmM_MMmm), as described in <bits/sysmacros.h>.
 */
static inline uint64_t makedev_dotl(uint32_t dev_major, uint32_t dev_minor)
{
    /* Bit layout taken from glibc sysmacros.h. */
    const uint64_t major_lo = dev_major & 0x00000fffu;
    const uint64_t major_hi = dev_major & 0xfffff000u;
    const uint64_t minor_lo = dev_minor & 0x000000ffu;
    const uint64_t minor_hi = dev_minor & 0xffffff00u;

    return (major_lo << 8) | (major_hi << 32) | (minor_lo << 0) |
           (minor_hi << 12);
}
#endif
/*
 * Converts a device number from the host's dev_t representation into the
 * Linux device number format. Both the width of dev_t and its encoding are
 * system dependent, so a conversion is required for Linux guests whenever
 * the host is not running Linux; on Linux hosts the value is passed through.
 */
static inline uint64_t host_dev_to_dotl_dev(dev_t dev)
{
#ifndef CONFIG_LINUX
    return makedev_dotl(major(dev), minor(dev));
#else
    return dev;
#endif
}
/*
 * Translates an errno value from the host's numbering to Linux's numbering
 * where the two differ. Values without a known translation are returned
 * unchanged.
 */
static inline int errno_to_dotl(int err)
{
#if defined(CONFIG_LINUX)
    /* Linux -> Linux: the numbering already matches. */
#elif defined(CONFIG_DARWIN)
    /*
     * macOS hosts: translation is mandatory.
     *
     * FIXME: Only the most important errnos are translated so far; this
     * should be extended to cover as many errnos as possible in future.
     */
    static const struct {
        int host;
        int dotl;
    } xlate[] = {
        { ENAMETOOLONG, 36 }, /* ==ENAMETOOLONG on Linux */
        { ENOTEMPTY,    39 }, /* ==ENOTEMPTY on Linux */
        { ELOOP,        40 }, /* ==ELOOP on Linux */
        { ENOATTR,      61 }, /* ==ENODATA on Linux */
        { ENOTSUP,      95 }, /* ==EOPNOTSUPP on Linux */
        { EOPNOTSUPP,   95 }, /* ==EOPNOTSUPP on Linux */
    };
    unsigned int i;

    /* First matching entry wins, same as an if/else-if chain. */
    for (i = 0; i < sizeof(xlate) / sizeof(xlate[0]); i++) {
        if (err == xlate[i].host) {
            return xlate[i].dotl;
        }
    }
#else
#error Missing errno translation to Linux for this host system
#endif
    return err;
}
/*
 * qemu_* aliases for the host's file system calls.
 *
 * All of them map 1:1 onto the host function of the same name, except for
 * qemu_fgetxattr() on Darwin, which appends two trailing 0 arguments to
 * the fgetxattr() call.
 */
#ifndef CONFIG_DARWIN
#define qemu_fgetxattr      fgetxattr
#else
#define qemu_fgetxattr(...) fgetxattr(__VA_ARGS__, 0, 0)
#endif
#define qemu_openat         openat
#define qemu_fstat          fstat
#define qemu_fstatat        fstatat
#define qemu_mkdirat        mkdirat
#define qemu_renameat       renameat
#define qemu_utimensat      utimensat
#define qemu_unlinkat       unlinkat
/*
 * Closes @fd while leaving errno exactly as it was on entry, so a caller
 * on an error path can still report the original failure afterwards.
 */
static inline void close_preserve_errno(int fd)
{
    const int saved_errno = errno;

    (void)close(fd);
    errno = saved_errno;
}
/**
 * close_if_special_file() - Close @fd if neither regular file nor directory.
 *
 * @fd: file descriptor of open file
 * Return: 0 on regular file or directory (@fd is left open), -1 otherwise
 *         (@fd has been closed)
 *
 * If the file cannot be stat'ed, @fd is closed and errno of the failed
 * stat call is preserved. If the file turns out to be a special file, @fd
 * is closed and errno is set to ENXIO.
 *
 * CVE-2023-2861: Prohibit opening any special file directly on host
 * (especially device files), as a compromised client could potentially gain
 * access outside exported tree under certain, unsafe setups. We expect
 * client to handle I/O on special files exclusively on guest side.
 */
static inline int close_if_special_file(int fd)
{
    struct stat st;
    int is_reg_or_dir;

    if (qemu_fstat(fd, &st) < 0) {
        close_preserve_errno(fd);
        return -1;
    }

    is_reg_or_dir = S_ISREG(st.st_mode) || S_ISDIR(st.st_mode);
    if (is_reg_or_dir) {
        return 0;
    }

    error_report_once(
        "9p: broken or compromised client detected; attempt to open "
        "special file (i.e. neither regular file, nor directory)"
    );
    close(fd);
    errno = ENXIO;
    return -1;
}
- static inline int openat_dir(int dirfd, const char *name)
- {
- return qemu_openat(dirfd, name,
- O_DIRECTORY | O_RDONLY | O_NOFOLLOW | O_PATH_9P_UTIL);
- }
- static inline int openat_file(int dirfd, const char *name, int flags,
- mode_t mode)
- {
- int fd, serrno, ret;
- #ifndef CONFIG_DARWIN
- again:
- #endif
- fd = qemu_openat(dirfd, name, flags | O_NOFOLLOW | O_NOCTTY | O_NONBLOCK,
- mode);
- if (fd == -1) {
- #ifndef CONFIG_DARWIN
- if (errno == EPERM && (flags & O_NOATIME)) {
- /*
- * The client passed O_NOATIME but we lack permissions to honor it.
- * Rather than failing the open, fall back without O_NOATIME. This
- * doesn't break the semantics on the client side, as the Linux
- * open(2) man page notes that O_NOATIME "may not be effective on
- * all filesystems". In particular, NFS and other network
- * filesystems ignore it entirely.
- */
- flags &= ~O_NOATIME;
- goto again;
- }
- #endif
- return -1;
- }
- /* Only if O_PATH is not set ... */
- if (!(flags & O_PATH_9P_UTIL)) {
- /*
- * Prevent I/O on special files (device files, etc.) on host side,
- * however it is safe and required to allow opening them with O_PATH,
- * as this is limited to (required) path based operations only.
- */
- if (close_if_special_file(fd) < 0) {
- return -1;
- }
- serrno = errno;
- /*
- * O_NONBLOCK was only needed to open the file. Let's drop it. We don't
- * do that with O_PATH since fcntl(F_SETFL) isn't supported, and
- * openat() ignored it anyway.
- */
- ret = fcntl(fd, F_SETFL, flags);
- assert(!ret);
- errno = serrno;
- }
- return fd;
- }
/*
 * Extended attribute helpers addressing a file by directory file descriptor
 * plus relative name. They are only declared here; the implementations live
 * outside this header.
 * NOTE(review): going by the "_nofollow" suffix these presumably do not
 * follow a trailing symlink - confirm against the implementations.
 */
ssize_t fgetxattrat_nofollow(int dirfd,
                             const char *path,
                             const char *name,
                             void *value,
                             size_t size);

int fsetxattrat_nofollow(int dirfd,
                         const char *path,
                         const char *name,
                         void *value,
                         size_t size,
                         int flags);

ssize_t flistxattrat_nofollow(int dirfd,
                              const char *filename,
                              char *list,
                              size_t size);

ssize_t fremovexattrat_nofollow(int dirfd,
                                const char *filename,
                                const char *name);
/*
 * Returns the directory stream offset stored in @dent.
 *
 * Darwin has d_seekoff, which appears to function similarly to d_off.
 * However, it does not appear to be supported on all file systems, so
 * callers must make sure it has been manually injected beforehand and
 * call this helper when the offset is needed.
 */
static inline off_t qemu_dirent_off(struct dirent *dent)
{
#ifndef CONFIG_DARWIN
    return dent->d_off;
#else
    return dent->d_seekoff;
#endif
}
/**
 * qemu_dirent_dup() - Duplicate directory entry @dent.
 *
 * @dent: original directory entry to be duplicated
 * Return: duplicated directory entry which should be freed with g_free()
 *
 * Prefer this function over open coding the duplication of dirent objects:
 * the actual size of a struct dirent may be bigger or shorter than
 * sizeof(struct dirent), and handling that correctly is platform specific
 * (see gitlab issue #841).
 */
static inline struct dirent *qemu_dirent_dup(struct dirent *dent)
{
#if defined _DIRENT_HAVE_D_RECLEN
    /* With d_reclen available, strlen() can usually be avoided. */
    size_t nbytes = dent->d_reclen;
#else
    size_t nbytes = 0;
#endif

    /*
     * A zero size must be handled even where d_reclen exists, because
     * some drivers may set d_reclen to zero. Fall back to the most
     * portable way of computing the entry size in that case.
     */
    if (!nbytes) {
        nbytes = offsetof(struct dirent, d_name) + strlen(dent->d_name) + 1;
    }

    return g_memdup(dent, nbytes);
}
/*
 * As long as mknodat is not available on macOS, a workaround based on
 * pthread_fchdir_np is needed. qemu_mknodat is defined in os-posix.c.
 * pthread_fchdir_np is weakly linked here as a guard in case it disappears
 * in future macOS versions, because it is a private API.
 */
#if defined(CONFIG_DARWIN) && defined(CONFIG_PTHREAD_FCHDIR_NP)
int pthread_fchdir_np(int fd) __attribute__((weak_import));
#endif

int qemu_mknodat(int dirfd, const char *filename, mode_t mode, dev_t dev);
/*
 * Returns a newly allocated string representation of the given open()
 * @flags. Intended for debugging (tracing) purposes only.
 */
char *qemu_open_flags_tostr(int flags);
- #endif
|