The implementation of LOOKUP_HANDLE modifies the LOOKUP operation to include
an extra inarg: the file handle for the parent directory (if it is
available). Also, because fuse_entry_out now has a extra variable size
struct (the actual handle), it also sets the out_argvar flag to true.
Most of the other modifications in this patch are a fallout from these
changes: because fuse_entry_out has been modified to include a variable size
struct, every operation that receives such a parameter have to take this
into account:
CREATE, LINK, LOOKUP, MKDIR, MKNOD, READDIRPLUS, SYMLINK, TMPFILE
Signed-off-by: Luis Henriques <luis@igalia.com>
---
fs/fuse/dev.c | 16 +++++++
fs/fuse/dir.c | 87 ++++++++++++++++++++++++++++++---------
fs/fuse/fuse_i.h | 34 +++++++++++++--
fs/fuse/inode.c | 69 +++++++++++++++++++++++++++----
fs/fuse/readdir.c | 10 ++---
include/uapi/linux/fuse.h | 8 ++++
6 files changed, 189 insertions(+), 35 deletions(-)
diff --git a/fs/fuse/dev.c b/fs/fuse/dev.c
index 629e8a043079..fc6acf45ae27 100644
--- a/fs/fuse/dev.c
+++ b/fs/fuse/dev.c
@@ -606,6 +606,22 @@ static void fuse_adjust_compat(struct fuse_conn *fc, struct fuse_args *args)
if (fc->minor < 4 && args->opcode == FUSE_STATFS)
args->out_args[0].size = FUSE_COMPAT_STATFS_SIZE;
+ if (fc->minor < 45) {
+ switch (args->opcode) {
+ case FUSE_CREATE:
+ case FUSE_LINK:
+ case FUSE_LOOKUP:
+ case FUSE_MKDIR:
+ case FUSE_MKNOD:
+ /* XXX case FUSE_READDIRPLUS: */
+ case FUSE_SYMLINK:
+ case FUSE_TMPFILE:
+ if (!WARN_ON_ONCE(args->in_numargs == 0))
+ args->in_numargs--;
+ args->out_args[0].size = FUSE_COMPAT_45_ENTRY_OUT_SIZE;
+ break;
+ }
+ }
if (fc->minor < 9) {
switch (args->opcode) {
case FUSE_LOOKUP:
diff --git a/fs/fuse/dir.c b/fs/fuse/dir.c
index e3fd5d148741..a6edb444180f 100644
--- a/fs/fuse/dir.c
+++ b/fs/fuse/dir.c
@@ -169,7 +169,8 @@ static void fuse_invalidate_entry(struct dentry *entry)
}
static void fuse_lookup_init(struct fuse_conn *fc, struct fuse_args *args,
- u64 nodeid, const struct qstr *name,
+ u64 nodeid, struct inode *dir,
+ const struct qstr *name,
struct fuse_entry_out *outarg)
{
args->opcode = FUSE_LOOKUP;
@@ -181,8 +182,24 @@ static void fuse_lookup_init(struct fuse_conn *fc, struct fuse_args *args,
args->in_args[2].size = 1;
args->in_args[2].value = "";
args->out_numargs = 1;
- args->out_args[0].size = sizeof(struct fuse_entry_out);
+ args->out_args[0].size = sizeof(*outarg) + outarg->fh.size;
args->out_args[0].value = outarg;
+
+ if (fc->lookup_handle) {
+ struct fuse_inode *fi = NULL;
+
+ args->opcode = FUSE_LOOKUP_HANDLE;
+ args->out_argvar = true;
+
+ if (dir)
+ fi = get_fuse_inode(dir);
+
+ if (fi && fi->fh) {
+ args->in_numargs = 4;
+ args->in_args[3].size = sizeof(*fi->fh) + fi->fh->size;
+ args->in_args[3].value = fi->fh;
+ }
+ }
}
/*
@@ -240,7 +257,7 @@ static int fuse_dentry_revalidate(struct inode *dir, const struct qstr *name,
attr_version = fuse_get_attr_version(fm->fc);
- fuse_lookup_init(fm->fc, &args, get_node_id(dir),
+ fuse_lookup_init(fm->fc, &args, get_node_id(dir), dir,
name, outarg);
ret = fuse_simple_request(fm, &args);
/* Zero nodeid is same as -ENOENT */
@@ -248,7 +265,8 @@ static int fuse_dentry_revalidate(struct inode *dir, const struct qstr *name,
ret = -ENOENT;
if (!ret) {
fi = get_fuse_inode(inode);
- if (outarg->nodeid != get_node_id(inode) ||
+ if (!fuse_file_handle_is_equal(fm->fc, fi->fh, &outarg->fh) ||
+ outarg->nodeid != get_node_id(inode) ||
(bool) IS_AUTOMOUNT(inode) != (bool) (outarg->attr.flags & FUSE_ATTR_SUBMOUNT)) {
fuse_queue_forget(fm->fc, forget,
outarg->nodeid, 1);
@@ -365,8 +383,9 @@ bool fuse_invalid_attr(struct fuse_attr *attr)
return !fuse_valid_type(attr->mode) || !fuse_valid_size(attr->size);
}
-int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name,
- struct fuse_entry_out *outarg, struct inode **inode)
+int fuse_lookup_name(struct super_block *sb, u64 nodeid, struct inode *dir,
+ const struct qstr *name, struct fuse_entry_out *outarg,
+ struct inode **inode)
{
struct fuse_mount *fm = get_fuse_mount_super(sb);
FUSE_ARGS(args);
@@ -388,14 +407,15 @@ int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name
attr_version = fuse_get_attr_version(fm->fc);
evict_ctr = fuse_get_evict_ctr(fm->fc);
- fuse_lookup_init(fm->fc, &args, nodeid, name, outarg);
+ fuse_lookup_init(fm->fc, &args, nodeid, dir, name, outarg);
err = fuse_simple_request(fm, &args);
/* Zero nodeid is same as -ENOENT, but with valid timeout */
- if (err || !outarg->nodeid)
+ if (err < 0 || !outarg->nodeid) // XXX err = size if args->out_argvar = true
goto out_put_forget;
err = -EIO;
- if (fuse_invalid_attr(&outarg->attr))
+ if (fuse_invalid_attr(&outarg->attr) ||
+ fuse_invalid_file_handle(fm->fc, &outarg->fh))
goto out_put_forget;
if (outarg->nodeid == FUSE_ROOT_ID && outarg->generation != 0) {
pr_warn_once("root generation should be zero\n");
@@ -404,7 +424,8 @@ int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name
*inode = fuse_iget(sb, outarg->nodeid, outarg->generation,
&outarg->attr, ATTR_TIMEOUT(outarg),
- attr_version, evict_ctr);
+ attr_version, evict_ctr,
+ &outarg->fh);
err = -ENOMEM;
if (!*inode) {
fuse_queue_forget(fm->fc, forget, outarg->nodeid, 1);
@@ -440,14 +461,14 @@ static struct dentry *fuse_lookup(struct inode *dir, struct dentry *entry,
return ERR_PTR(-ENOMEM);
locked = fuse_lock_inode(dir);
- err = fuse_lookup_name(dir->i_sb, get_node_id(dir), &entry->d_name,
+ err = fuse_lookup_name(dir->i_sb, get_node_id(dir), dir, &entry->d_name,
outarg, &inode);
fuse_unlock_inode(dir, locked);
if (err == -ENOENT) {
outarg_valid = false;
err = 0;
}
- if (err)
+ if (err < 0) // XXX err = size if args->out_argvar = true
goto out_err;
err = -EIO;
@@ -689,24 +710,36 @@ static int fuse_create_open(struct mnt_idmap *idmap, struct inode *dir,
args.in_args[1].size = entry->d_name.len + 1;
args.in_args[1].value = entry->d_name.name;
args.out_numargs = 2;
- args.out_args[0].size = sizeof(*outentry);
+ args.out_args[0].size = sizeof(*outentry) + outentry->fh.size;
args.out_args[0].value = outentry;
/* Store outarg for fuse_finish_open() */
outopenp = &ff->args->open_outarg;
args.out_args[1].size = sizeof(*outopenp);
args.out_args[1].value = outopenp;
+ if (fm->fc->lookup_handle) {
+ fi = get_fuse_inode(dir);
+ args.out_argvar = true;
+ args.out_argvar_idx = 0;
+ if (fi->fh) {
+ args.in_numargs = 3;
+ args.in_args[2].size = sizeof(*fi->fh) + fi->fh->size;
+ args.in_args[2].value = fi->fh;
+ }
+ }
+
err = get_create_ext(idmap, &args, dir, entry, mode);
if (err)
goto out_free_outentry;
err = fuse_simple_idmap_request(idmap, fm, &args);
free_ext_value(&args);
- if (err)
+ if (err < 0) // XXX err = size if args->out_argvar = true
goto out_free_outentry;
err = -EIO;
if (!S_ISREG(outentry->attr.mode) || invalid_nodeid(outentry->nodeid) ||
+ fuse_invalid_file_handle(fm->fc, &outentry->fh) ||
fuse_invalid_attr(&outentry->attr))
goto out_free_outentry;
@@ -714,7 +747,8 @@ static int fuse_create_open(struct mnt_idmap *idmap, struct inode *dir,
ff->nodeid = outentry->nodeid;
ff->open_flags = outopenp->open_flags;
inode = fuse_iget(dir->i_sb, outentry->nodeid, outentry->generation,
- &outentry->attr, ATTR_TIMEOUT(outentry), 0, 0);
+ &outentry->attr, ATTR_TIMEOUT(outentry), 0, 0,
+ &outentry->fh);
if (!inode) {
flags &= ~(O_CREAT | O_EXCL | O_TRUNC);
fuse_sync_release(NULL, ff, flags);
@@ -830,9 +864,22 @@ static struct dentry *create_new_entry(struct mnt_idmap *idmap, struct fuse_moun
args->nodeid = get_node_id(dir);
args->out_numargs = 1;
- args->out_args[0].size = sizeof(*outarg);
+ args->out_args[0].size = sizeof(*outarg) + outarg->fh.size;
args->out_args[0].value = outarg;
+ if (fm->fc->lookup_handle) {
+ struct fuse_inode *fi = get_fuse_inode(dir);
+ int idx = args->in_numargs;
+
+ args->out_argvar = true;
+ args->out_argvar_idx = 0;
+ if (fi->fh && !WARN_ON_ONCE(idx >= 4)) {
+ args->in_args[idx].size = sizeof(*fi->fh) + fi->fh->size;
+ args->in_args[idx].value = fi->fh;
+ args->in_numargs++;
+ }
+ }
+
if (args->opcode != FUSE_LINK) {
err = get_create_ext(idmap, args, dir, entry, mode);
if (err)
@@ -841,18 +888,20 @@ static struct dentry *create_new_entry(struct mnt_idmap *idmap, struct fuse_moun
err = fuse_simple_idmap_request(idmap, fm, args);
free_ext_value(args);
- if (err)
+ if (err < 0) // XXX err = size if args->out_argvar = true
goto out_free_outarg;
err = -EIO;
- if (invalid_nodeid(outarg->nodeid) || fuse_invalid_attr(&outarg->attr))
+ if (invalid_nodeid(outarg->nodeid) || fuse_invalid_attr(&outarg->attr) ||
+ fuse_invalid_file_handle(fm->fc, &outarg->fh))
goto out_free_outarg;
if ((outarg->attr.mode ^ mode) & S_IFMT)
goto out_free_outarg;
inode = fuse_iget(dir->i_sb, outarg->nodeid, outarg->generation,
- &outarg->attr, ATTR_TIMEOUT(outarg), 0, 0);
+ &outarg->attr, ATTR_TIMEOUT(outarg), 0, 0,
+ &outarg->fh);
if (!inode) {
fuse_queue_forget(fm->fc, forget, outarg->nodeid, 1);
kfree(outarg);
diff --git a/fs/fuse/fuse_i.h b/fs/fuse/fuse_i.h
index fad05fae7e54..d0f3c81b5612 100644
--- a/fs/fuse/fuse_i.h
+++ b/fs/fuse/fuse_i.h
@@ -216,6 +216,8 @@ struct fuse_inode {
* so preserve the blocksize specified by the server.
*/
u8 cached_i_blkbits;
+
+ struct fuse_file_handle *fh;
};
/** FUSE inode state bits */
@@ -1067,6 +1069,26 @@ static inline int invalid_nodeid(u64 nodeid)
return !nodeid || nodeid == FUSE_ROOT_ID;
}
+static inline bool fuse_invalid_file_handle(struct fuse_conn *fc,
+ struct fuse_file_handle *handle)
+{
+ if (!fc->lookup_handle)
+ return false;
+
+ return !handle->size || (handle->size >= FUSE_MAX_HANDLE_SZ);
+}
+
+static inline bool fuse_file_handle_is_equal(struct fuse_conn *fc,
+ struct fuse_file_handle *fh1,
+ struct fuse_file_handle *fh2)
+{
+ if (!fc->lookup_handle || !fh2->size || // XXX more OPs without handle
+ ((fh1->size == fh2->size) &&
+ (!memcmp(fh1->handle, fh2->handle, fh1->size))))
+ return true;
+ return false;
+}
+
static inline u64 fuse_get_attr_version(struct fuse_conn *fc)
{
return atomic64_read(&fc->attr_version);
@@ -1098,7 +1120,10 @@ static inline struct fuse_entry_out *fuse_entry_out_alloc(struct fuse_conn *fc)
{
struct fuse_entry_out *entryout;
- entryout = kzalloc(sizeof(*entryout), GFP_KERNEL_ACCOUNT);
+ entryout = kzalloc(sizeof(*entryout) + fc->max_handle_sz,
+ GFP_KERNEL_ACCOUNT);
+ if (entryout)
+ entryout->fh.size = fc->max_handle_sz;
return entryout;
}
@@ -1145,10 +1170,11 @@ extern const struct dentry_operations fuse_dentry_operations;
struct inode *fuse_iget(struct super_block *sb, u64 nodeid,
int generation, struct fuse_attr *attr,
u64 attr_valid, u64 attr_version,
- u64 evict_ctr);
+ u64 evict_ctr, struct fuse_file_handle *fh);
-int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name,
- struct fuse_entry_out *outarg, struct inode **inode);
+int fuse_lookup_name(struct super_block *sb, u64 nodeid, struct inode *dir,
+ const struct qstr *name, struct fuse_entry_out *outarg,
+ struct inode **inode);
/**
* Send FORGET command
diff --git a/fs/fuse/inode.c b/fs/fuse/inode.c
index bc84e7ed1e3d..f565f7e8118d 100644
--- a/fs/fuse/inode.c
+++ b/fs/fuse/inode.c
@@ -95,6 +95,25 @@ static struct fuse_submount_lookup *fuse_alloc_submount_lookup(void)
return NULL;
}
+/*
+ * XXX postpone this allocation and later use the real size instead of max
+ */
+static bool fuse_inode_handle_alloc(struct super_block *sb,
+ struct fuse_inode *fi)
+{
+ struct fuse_conn *fc = get_fuse_conn_super(sb);
+
+ fi->fh = NULL;
+ if (fc->lookup_handle) {
+ fi->fh = kzalloc(sizeof(*fi->fh) + fc->max_handle_sz,
+ GFP_KERNEL_ACCOUNT);
+ if (!fi->fh)
+ return false;
+ }
+
+ return true;
+}
+
static struct inode *fuse_alloc_inode(struct super_block *sb)
{
struct fuse_inode *fi;
@@ -120,8 +139,15 @@ static struct inode *fuse_alloc_inode(struct super_block *sb)
if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH))
fuse_inode_backing_set(fi, NULL);
+ if (!fuse_inode_handle_alloc(sb, fi))
+ goto out_free_dax;
+
return &fi->inode;
+out_free_dax:
+#ifdef CONFIG_FUSE_DAX
+ kfree(fi->dax);
+#endif
out_free_forget:
kfree(fi->forget);
out_free:
@@ -132,6 +158,7 @@ static struct inode *fuse_alloc_inode(struct super_block *sb)
static void fuse_free_inode(struct inode *inode)
{
struct fuse_inode *fi = get_fuse_inode(inode);
+ struct fuse_conn *fc = get_fuse_conn(inode);
mutex_destroy(&fi->mutex);
kfree(fi->forget);
@@ -141,6 +168,9 @@ static void fuse_free_inode(struct inode *inode)
if (IS_ENABLED(CONFIG_FUSE_PASSTHROUGH))
fuse_backing_put(fuse_inode_backing(fi));
+ if (fc->lookup_handle)
+ kfree(fi->fh);
+
kmem_cache_free(fuse_inode_cachep, fi);
}
@@ -465,7 +495,7 @@ static int fuse_inode_set(struct inode *inode, void *_nodeidp)
struct inode *fuse_iget(struct super_block *sb, u64 nodeid,
int generation, struct fuse_attr *attr,
u64 attr_valid, u64 attr_version,
- u64 evict_ctr)
+ u64 evict_ctr, struct fuse_file_handle *fh)
{
struct inode *inode;
struct fuse_inode *fi;
@@ -505,6 +535,30 @@ struct inode *fuse_iget(struct super_block *sb, u64 nodeid,
if (!inode)
return NULL;
+ fi = get_fuse_inode(inode);
+ if (fc->lookup_handle) {
+ if ((fh == NULL) && (nodeid != FUSE_ROOT_ID)) {
+ pr_err("NULL file handle for nodeid %llu\n", nodeid);
+ iput(inode);
+ return NULL;
+ }
+ if (fi->fh->size)
+ pr_warn_ratelimited(
+ "Handle already set for nodeid %llu (size: %u)\n",
+ nodeid, fi->fh->size);
+ if (fh) {
+ if (fh->size >= fc->max_handle_sz) {
+ pr_err("File handle too big (%u)\n", fh->size);
+ iput(inode);
+ return NULL;
+ }
+ fi->fh->size = fh->size;
+ memcpy(fi->fh->handle, fh->handle, fi->fh->size);
+ } else {
+ fi->fh->size = 0;
+ memset(fi->fh, 0, fc->max_handle_sz);
+ }
+ }
if ((inode->i_state & I_NEW)) {
inode->i_flags |= S_NOATIME;
if (!fc->writeback_cache || !S_ISREG(attr->mode))
@@ -512,7 +566,8 @@ struct inode *fuse_iget(struct super_block *sb, u64 nodeid,
inode->i_generation = generation;
fuse_init_inode(inode, attr, fc);
unlock_new_inode(inode);
- } else if (fuse_stale_inode(inode, generation, attr)) {
+ } else if (fuse_stale_inode(inode, generation, attr) ||
+ !fuse_file_handle_is_equal(fc, fi->fh, fh)) {
/* nodeid was reused, any I/O on the old inode should fail */
fuse_make_bad(inode);
if (inode != d_inode(sb->s_root)) {
@@ -521,7 +576,6 @@ struct inode *fuse_iget(struct super_block *sb, u64 nodeid,
goto retry;
}
}
- fi = get_fuse_inode(inode);
spin_lock(&fi->lock);
fi->nlookup++;
spin_unlock(&fi->lock);
@@ -1059,7 +1113,7 @@ static struct inode *fuse_get_root_inode(struct super_block *sb, unsigned int mo
attr.mode = mode;
attr.ino = FUSE_ROOT_ID;
attr.nlink = 1;
- return fuse_iget(sb, FUSE_ROOT_ID, 0, &attr, 0, 0, 0);
+ return fuse_iget(sb, FUSE_ROOT_ID, 0, &attr, 0, 0, 0, NULL); // XXX
}
struct fuse_inode_handle {
@@ -1092,7 +1146,7 @@ static struct dentry *fuse_get_dentry(struct super_block *sb,
goto out_err;
}
- err = fuse_lookup_name(sb, handle->nodeid, &name, outarg,
+ err = fuse_lookup_name(sb, handle->nodeid, NULL, &name, outarg,
&inode);
kfree(outarg);
if (err && err != -ENOENT)
@@ -1199,7 +1253,7 @@ static struct dentry *fuse_get_parent(struct dentry *child)
return ERR_PTR(-ENOMEM);
err = fuse_lookup_name(child_inode->i_sb, get_node_id(child_inode),
- &dotdot_name, outarg, &inode);
+ child_inode, &dotdot_name, outarg, &inode);
kfree(outarg);
if (err) {
if (err == -ENOENT)
@@ -1757,8 +1811,9 @@ static int fuse_fill_super_submount(struct super_block *sb,
return -ENOMEM;
fuse_fill_attr_from_inode(&root_attr, parent_fi);
+ /* XXX using parent fh */
root = fuse_iget(sb, parent_fi->nodeid, 0, &root_attr, 0, 0,
- fuse_get_evict_ctr(fm->fc));
+ fuse_get_evict_ctr(fm->fc), parent_fi->fh);
/*
* This inode is just a duplicate, so it is not looked up and
* its nlookup should not be incremented. fuse_iget() does
diff --git a/fs/fuse/readdir.c b/fs/fuse/readdir.c
index c2aae2eef086..04fb6636c4c0 100644
--- a/fs/fuse/readdir.c
+++ b/fs/fuse/readdir.c
@@ -185,12 +185,12 @@ static int fuse_direntplus_link(struct file *file,
return 0;
}
- if (invalid_nodeid(o->nodeid))
- return -EIO;
- if (fuse_invalid_attr(&o->attr))
+ fc = get_fuse_conn(dir);
+
+ if (invalid_nodeid(o->nodeid) || fuse_invalid_attr(&o->attr) ||
+ fuse_invalid_file_handle(fc, &o->fh))
return -EIO;
- fc = get_fuse_conn(dir);
epoch = atomic_read(&fc->epoch);
name.hash = full_name_hash(parent, name.name, name.len);
@@ -235,7 +235,7 @@ static int fuse_direntplus_link(struct file *file,
} else {
inode = fuse_iget(dir->i_sb, o->nodeid, o->generation,
&o->attr, ATTR_TIMEOUT(o),
- attr_version, evict_ctr);
+ attr_version, evict_ctr, &o->fh);
if (!inode)
inode = ERR_PTR(-ENOMEM);
diff --git a/include/uapi/linux/fuse.h b/include/uapi/linux/fuse.h
index 4acf71b407c9..b75744d2d75d 100644
--- a/include/uapi/linux/fuse.h
+++ b/include/uapi/linux/fuse.h
@@ -690,6 +690,13 @@ enum fuse_notify_code {
#define FUSE_MIN_READ_BUFFER 8192
#define FUSE_COMPAT_ENTRY_OUT_SIZE 120
+#define FUSE_COMPAT_45_ENTRY_OUT_SIZE 128
+
+struct fuse_file_handle {
+ uint32_t size;
+ uint32_t type;
+ char handle[0];
+};
struct fuse_entry_out {
uint64_t nodeid; /* Inode ID */
@@ -700,6 +707,7 @@ struct fuse_entry_out {
uint32_t entry_valid_nsec;
uint32_t attr_valid_nsec;
struct fuse_attr attr;
+ struct fuse_file_handle fh;
};
struct fuse_forget_in {
© 2016 - 2025 Red Hat, Inc.