From: Khalid Aziz <khalid.aziz@oracle.com>
To: akpm@linux-foundation.org, willy@infradead.org,
longpeng2@huawei.com, arnd@arndb.de, dave.hansen@linux.intel.com,
david@redhat.com, rppt@kernel.org, surenb@google.com,
linux-kernel@vger.kernel.org, linux-mm@kvack.org
Cc: Khalid Aziz <khalid.aziz@oracle.com>
Subject: [RFC PATCH 4/6] mm: implement mshare_unlink syscall
Date: Tue, 18 Jan 2022 14:19:16 -0700 [thread overview]
Message-ID: <afc1eed3b9095b279c4439a3627afa4973bad007.1642526745.git.khalid.aziz@oracle.com> (raw)
In-Reply-To: <cover.1642526745.git.khalid.aziz@oracle.com>
Add code to allow the mshare syscall to be made for an existing mshare'd
region. Complete the implementation of the mshare_unlink syscall. Make
reading the mshare resource name from userspace safer. Fix code to allow
msharefs to be unmounted cleanly.
Signed-off-by: Khalid Aziz <khalid.aziz@oracle.com>
---
mm/mshare.c | 144 +++++++++++++++++++++++++++++++++++++++++-----------
1 file changed, 113 insertions(+), 31 deletions(-)
diff --git a/mm/mshare.c b/mm/mshare.c
index d998b23c25ab..8273136363cc 100644
--- a/mm/mshare.c
+++ b/mm/mshare.c
@@ -22,11 +22,24 @@
struct mshare_data {
struct mm_struct *mm;
+ mode_t mode;
refcount_t refcnt;
};
static struct super_block *msharefs_sb;
+static void
+msharefs_evict_inode(struct inode *inode)
+{
+ clear_inode(inode);
+}
+
+static const struct super_operations msharefs_ops = {
+ .statfs = simple_statfs,
+ .drop_inode = generic_delete_inode,
+ .evict_inode = msharefs_evict_inode,
+};
+
static ssize_t
mshare_read(struct kiocb *iocb, struct iov_iter *iov)
{
@@ -114,7 +127,7 @@ static struct inode
}
static int
-mshare_file_create(const char *name, unsigned long flags,
+mshare_file_create(struct filename *fname, int flags,
struct mshare_data *info)
{
struct inode *inode;
@@ -123,13 +136,16 @@ mshare_file_create(const char *name, unsigned long flags,
root = msharefs_sb->s_root;
+ /*
+ * This is a read only file.
+ */
inode = msharefs_get_inode(msharefs_sb, S_IFREG | 0400);
if (IS_ERR(inode))
return PTR_ERR(inode);
inode->i_private = info;
- dentry = msharefs_alloc_dentry(root, name);
+ dentry = msharefs_alloc_dentry(root, fname->name);
if (IS_ERR(dentry)) {
err = PTR_ERR(dentry);
goto fail_inode;
@@ -137,6 +153,7 @@ mshare_file_create(const char *name, unsigned long flags,
d_add(dentry, inode);
+ dput(dentry);
return err;
fail_inode:
@@ -150,10 +167,13 @@ mshare_file_create(const char *name, unsigned long flags,
SYSCALL_DEFINE5(mshare, const char __user *, name, unsigned long, addr,
unsigned long, len, int, oflag, mode_t, mode)
{
- char mshare_name[NAME_MAX];
struct mshare_data *info;
struct mm_struct *mm;
- int err;
+ struct filename *fname = getname(name);
+ struct dentry *dentry;
+ struct inode *inode;
+ struct qstr namestr;
+ int err = PTR_ERR(fname);
/*
* Address range being shared must be aligned to pgdir
@@ -162,29 +182,56 @@ SYSCALL_DEFINE5(mshare, const char __user *, name, unsigned long, addr,
if ((addr | len) & (PGDIR_SIZE - 1))
return -EINVAL;
- err = copy_from_user(mshare_name, name, NAME_MAX);
+ if (IS_ERR(fname))
+ goto err_out;
+
+ /*
+ * Does this mshare entry exist already? If it does, calling
+ * mshare with O_EXCL|O_CREAT is an error
+ */
+ namestr.name = fname->name;
+ namestr.len = strlen(fname->name);
+ err = msharefs_d_hash(msharefs_sb->s_root, &namestr);
if (err)
goto err_out;
+ dentry = d_lookup(msharefs_sb->s_root, &namestr);
+ if (dentry && (oflag & (O_EXCL|O_CREAT))) {
+ err = -EEXIST;
+ dput(dentry);
+ goto err_out;
+ }
- mm = mm_alloc();
- if (!mm)
- return -ENOMEM;
- info = kzalloc(sizeof(*info), GFP_KERNEL);
- if (!info) {
- err = -ENOMEM;
- goto err_relmm;
+ if (dentry) {
+ inode = d_inode(dentry);
+ if (inode == NULL) {
+ err = -EINVAL;
+ goto err_out;
+ }
+ info = inode->i_private;
+ refcount_inc(&info->refcnt);
+ dput(dentry);
+ } else {
+ mm = mm_alloc();
+ if (!mm)
+ return -ENOMEM;
+ info = kzalloc(sizeof(*info), GFP_KERNEL);
+ if (!info) {
+ err = -ENOMEM;
+ goto err_relmm;
+ }
+ mm->mmap_base = addr;
+ mm->task_size = addr + len;
+ if (!mm->task_size)
+ mm->task_size--;
+ info->mm = mm;
+ info->mode = mode;
+ refcount_set(&info->refcnt, 1);
+ err = mshare_file_create(fname, oflag, info);
+ if (err)
+ goto err_relinfo;
}
- mm->mmap_base = addr;
- mm->task_size = addr + len;
- if (!mm->task_size)
- mm->task_size--;
- info->mm = mm;
- refcount_set(&info->refcnt, 1);
-
- err = mshare_file_create(mshare_name, oflag, info);
- if (err)
- goto err_relinfo;
+ putname(fname);
return 0;
err_relinfo:
@@ -192,6 +239,7 @@ SYSCALL_DEFINE5(mshare, const char __user *, name, unsigned long, addr,
err_relmm:
mmput(mm);
err_out:
+ putname(fname);
return err;
}
@@ -200,21 +248,54 @@ SYSCALL_DEFINE5(mshare, const char __user *, name, unsigned long, addr,
*/
SYSCALL_DEFINE1(mshare_unlink, const char *, name)
{
- char mshare_name[NAME_MAX];
- int err;
+ struct filename *fname = getname(name);
+ int err = PTR_ERR(fname);
+ struct dentry *dentry;
+ struct inode *inode;
+ struct mshare_data *info;
+ struct qstr namestr;
- /*
- * Delete the named object
- *
- * TODO: Mark mshare'd range for deletion
- *
- */
- err = copy_from_user(mshare_name, name, NAME_MAX);
+ if (IS_ERR(fname))
+ goto err_out;
+
+ namestr.name = fname->name;
+ namestr.len = strlen(fname->name);
+ err = msharefs_d_hash(msharefs_sb->s_root, &namestr);
if (err)
goto err_out;
+ dentry = d_lookup(msharefs_sb->s_root, &namestr);
+ if (dentry == NULL) {
+ err = -EINVAL;
+ goto err_out;
+ }
+
+ inode = d_inode(dentry);
+ if (inode == NULL) {
+ err = -EINVAL;
+ goto err_dput;
+ }
+ info = inode->i_private;
+
+ /*
+ * Is this the last reference?
+ */
+ if (refcount_dec_and_test(&info->refcnt)) {
+ simple_unlink(d_inode(msharefs_sb->s_root), dentry);
+ d_drop(dentry);
+ d_delete(dentry);
+ mmput(info->mm);
+ kfree(info);
+ } else {
+ dput(dentry);
+ }
+
+ putname(fname);
return 0;
+err_dput:
+ dput(dentry);
err_out:
+ putname(fname);
return err;
}
@@ -228,6 +309,7 @@ msharefs_fill_super(struct super_block *sb, struct fs_context *fc)
static const struct tree_descr empty_descr = {""};
int err;
+ sb->s_op = &msharefs_ops;
sb->s_d_op = &msharefs_d_ops;
err = simple_fill_super(sb, MSHARE_MAGIC, &empty_descr);
if (err)
--
2.32.0
next prev parent reply other threads:[~2022-01-18 21:20 UTC|newest]
Thread overview: 54+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-01-18 21:19 [RFC PATCH 0/6] Add support for shared PTEs across processes Khalid Aziz
2022-01-18 21:19 ` [RFC PATCH 1/6] mm: Add new system calls mshare, mshare_unlink Khalid Aziz
2022-01-18 21:19 ` [RFC PATCH 2/6] mm: Add msharefs filesystem Khalid Aziz
2022-01-18 21:19 ` [RFC PATCH 3/6] mm: Add read for msharefs Khalid Aziz
2022-01-18 21:19 ` Khalid Aziz [this message]
2022-01-18 21:19 ` [RFC PATCH 5/6] mm: Add locking to msharefs syscalls Khalid Aziz
2022-01-18 21:19 ` [RFC PATCH 6/6] mm: Add basic page table sharing using mshare Khalid Aziz
2022-01-18 21:41 ` [RFC PATCH 0/6] Add support for shared PTEs across processes Dave Hansen
2022-01-18 21:46 ` Matthew Wilcox
2022-01-18 22:47 ` Khalid Aziz
2022-01-18 22:06 ` Dave Hansen
2022-01-18 22:52 ` Khalid Aziz
2022-01-19 11:38 ` Mark Hemment
2022-01-19 17:02 ` Khalid Aziz
2022-01-20 12:49 ` Mark Hemment
2022-01-20 19:15 ` Khalid Aziz
2022-01-24 15:15 ` Mark Hemment
2022-01-24 15:27 ` Matthew Wilcox
2022-01-24 22:20 ` Khalid Aziz
2022-01-21 1:08 ` Barry Song
2022-01-21 2:13 ` Matthew Wilcox
2022-01-21 7:35 ` Barry Song
2022-01-21 14:47 ` Matthew Wilcox
2022-01-21 16:41 ` Khalid Aziz
2022-01-22 1:39 ` Longpeng (Mike, Cloud Infrastructure Service Product Dept.)
2022-01-22 1:41 ` Matthew Wilcox
2022-01-22 10:18 ` Thomas Schoebel-Theuer
2022-01-22 16:09 ` Matthew Wilcox
2022-01-22 11:31 ` Mike Rapoport
2022-01-22 18:29 ` Andy Lutomirski
2022-01-24 18:48 ` Khalid Aziz
2022-01-24 19:45 ` Andy Lutomirski
2022-01-24 22:30 ` Khalid Aziz
2022-01-24 23:16 ` Andy Lutomirski
2022-01-24 23:44 ` Khalid Aziz
2022-01-25 11:42 ` Kirill A. Shutemov
2022-01-25 12:09 ` William Kucharski
2022-01-25 13:18 ` David Hildenbrand
2022-01-25 14:01 ` Kirill A. Shutemov
2022-01-25 13:23 ` Matthew Wilcox
2022-01-25 13:59 ` Kirill A. Shutemov
2022-01-25 14:09 ` Matthew Wilcox
2022-01-25 18:57 ` Kirill A. Shutemov
2022-01-25 18:59 ` Matthew Wilcox
2022-01-26 4:04 ` Matthew Wilcox
2022-01-26 10:16 ` David Hildenbrand
2022-01-26 13:38 ` Matthew Wilcox
2022-01-26 13:55 ` David Hildenbrand
2022-01-26 14:12 ` Matthew Wilcox
2022-01-26 14:30 ` David Hildenbrand
2022-01-26 14:12 ` Mike Rapoport
2022-01-26 13:42 ` Kirill A. Shutemov
2022-01-26 14:18 ` Mike Rapoport
2022-01-26 17:33 ` Khalid Aziz
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=afc1eed3b9095b279c4439a3627afa4973bad007.1642526745.git.khalid.aziz@oracle.com \
--to=khalid.aziz@oracle.com \
--cc=akpm@linux-foundation.org \
--cc=arnd@arndb.de \
--cc=dave.hansen@linux.intel.com \
--cc=david@redhat.com \
--cc=linux-kernel@vger.kernel.org \
--cc=linux-mm@kvack.org \
--cc=longpeng2@huawei.com \
--cc=rppt@kernel.org \
--cc=surenb@google.com \
--cc=willy@infradead.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).