From: Darrick J. Wong <djwong@xxxxxxxxxx> The upper level fuse library creates a separate node object for every (i)node referenced by a directory entry. Unfortunately, it doesn't account for the possibility of hardlinks, which means that we can create multiple nodeids that refer to the same hardlinked inode. Inode locking in iomap mode in the kernel relies there only being one inode object for a hardlinked file, so we cannot allow anyone to hardlink an iomap file. The client had better not turn on iomap for an existing hardlinked file. Signed-off-by: "Darrick J. Wong" <djwong@xxxxxxxxxx> --- include/fuse.h | 18 ++++++++++ lib/fuse.c | 90 +++++++++++++++++++++++++++++++++++++++++++----- lib/fuse_versionscript | 2 + 3 files changed, 101 insertions(+), 9 deletions(-) diff --git a/include/fuse.h b/include/fuse.h index 7256f43fd5c39a..4c4fff837437c8 100644 --- a/include/fuse.h +++ b/include/fuse.h @@ -1415,6 +1415,24 @@ int fuse_fs_iomap_device_add(int fd, unsigned int flags); */ int fuse_fs_iomap_device_remove(int device_id); +/** + * Decide if we can enable iomap mode for a particular file for an upper-level + * fuse server. + * + * @param statbuf stat information for the file. + * @return true if it can be enabled, false if not. + */ +bool fuse_fs_can_enable_iomap(const struct stat *statbuf); + +/** + * Decide if we can enable iomap mode for a particular file for an upper-level + * fuse server. + * + * @param statxbuf statx information for the file. + * @return true if it can be enabled, false if not. + */ +bool fuse_fs_can_enable_iomapx(const struct statx *statxbuf); + int fuse_notify_poll(struct fuse_pollhandle *ph); /** diff --git a/lib/fuse.c b/lib/fuse.c index 6b211084e2175a..cbf2c5d3a67895 100644 --- a/lib/fuse.c +++ b/lib/fuse.c @@ -3249,10 +3249,66 @@ static void fuse_lib_rename(fuse_req_t req, fuse_ino_t olddir, reply_err(req, err); } +/* + * Decide if file IO for this inode can use iomap. + * + * The upper level libfuse creates internal node ids that have nothing to do + * with the ext2_ino_t that we give it. These internal node ids are what + * actually gets igetted in the kernel, which means that there can be multiple + * fuse_inode objects in the kernel for a single hardlinked inode in the fuse + * server. + * + * What this means, horrifyingly, is that on a fuse filesystem that supports + * hard links, the in-kernel i_rwsem does not protect against concurrent writes + * between files that point to the same inode. That in turn means that the + * file mode and size can get desynchronized between the multiple fuse_inode + * objects. This also means that we cannot cache iomaps in the kernel AT ALL + * because the caches will get out of sync, leading to WARN_ONs from the iomap + * zeroing code and probably data corruption after that. + * + * Therefore, libfuse must never create hardlinks of iomap files, and the + * predicates below allow fuse servers to decide if they can turn on iomap for + * existing hardlinked files. + */ +bool fuse_fs_can_enable_iomap(const struct stat *statbuf) +{ + struct fuse_context *ctxt = fuse_get_context(); + struct fuse_session *se = fuse_get_session(ctxt->fuse); + + if (!(se->conn.want_ext & FUSE_CAP_IOMAP)) + return false; + + return statbuf->st_nlink < 2; +} + +bool fuse_fs_can_enable_iomapx(const struct statx *statxbuf) +{ + struct fuse_context *ctxt = fuse_get_context(); + struct fuse_session *se = fuse_get_session(ctxt->fuse); + + if (!(se->conn.want_ext & FUSE_CAP_IOMAP)) + return false; + + return statxbuf->stx_nlink < 2; +} + +static bool fuse_lib_can_link(fuse_req_t req, fuse_ino_t ino) +{ + struct fuse *f = req_fuse_prepare(req); + struct node *node; + + if (!(req->se->conn.want_ext & FUSE_CAP_IOMAP)) + return true; + + node = get_node(f, ino); + return !(node->iflags & FUSE_IFLAG_IOMAP); +} + static void fuse_lib_link(fuse_req_t req, fuse_ino_t ino, fuse_ino_t newparent, const char *newname) { struct fuse *f = req_fuse_prepare(req); + struct fuse_intr_data d; struct fuse_entry_param e; char *oldpath; char *newpath; @@ -3261,17 +3317,33 @@ static void fuse_lib_link(fuse_req_t req, fuse_ino_t ino, fuse_ino_t newparent, err = get_path2(f, ino, NULL, newparent, newname, &oldpath, &newpath, NULL, NULL); - if (!err) { - struct fuse_intr_data d; + if (err) + goto out_reply; - fuse_prepare_interrupt(f, req, &d); - err = fuse_fs_link(f->fs, oldpath, newpath); - if (!err) - err = lookup_path(f, newparent, newname, newpath, - &e, &iflags, NULL); - fuse_finish_interrupt(f, req, &d); - free_path2(f, ino, newparent, NULL, NULL, oldpath, newpath); + /* + * The upper level fuse library creates a separate node object for + * every (i)node referenced by a directory entry. Unfortunately, it + * doesn't account for the possibility of hardlinks, which means that + * we can create multiple nodeids that refer to the same hardlinked + * inode. Inode locking in iomap mode in the kernel relies there only + * being one inode object for a hardlinked file, so we cannot allow + * anyone to hardlink an iomap file. The client had better not turn on + * iomap for an existing hardlinked file. + */ + if (!fuse_lib_can_link(req, ino)) { + err = -EPERM; + goto out_path; } + + fuse_prepare_interrupt(f, req, &d); + err = fuse_fs_link(f->fs, oldpath, newpath); + if (!err) + err = lookup_path(f, newparent, newname, newpath, + &e, &iflags, NULL); + fuse_finish_interrupt(f, req, &d); +out_path: + free_path2(f, ino, newparent, NULL, NULL, oldpath, newpath); +out_reply: reply_entry(req, &e, iflags, err); } diff --git a/lib/fuse_versionscript b/lib/fuse_versionscript index df78723e0f2518..aa16efdd8a9879 100644 --- a/lib/fuse_versionscript +++ b/lib/fuse_versionscript @@ -229,6 +229,8 @@ FUSE_3.99 { fuse_reply_create_iflags; fuse_reply_entry_iflags; fuse_add_direntry_plus_iflags; + fuse_fs_can_enable_iomap; + fuse_fs_can_enable_iomapx; } FUSE_3.18; # Local Variables: