[PATCH v2 07/20] mm/mshare: Add mmap support
From: Anthony Yznaga
Date: Thu Apr 03 2025 - 22:20:25 EST
From: Khalid Aziz <khalid@xxxxxxxxxx>
Add support for mapping an mshare region into a process after the
region has been established in msharefs. Disallow operations that
could split the resulting msharefs vma such as partial unmaps and
protection changes. Fault handling, mapping, unmapping, and
protection changes for objects mapped into an mshare region will
be done using the shared vmas created for them in the host mm. This
functionality will be added in later patches.
Signed-off-by: Khalid Aziz <khalid@xxxxxxxxxx>
Signed-off-by: Anthony Yznaga <anthony.yznaga@xxxxxxxxxx>
---
mm/mshare.c | 133 +++++++++++++++++++++++++++++++++++++++++++++++++++-
1 file changed, 132 insertions(+), 1 deletion(-)
diff --git a/mm/mshare.c b/mm/mshare.c
index 5eed18bc3b51..6bdbcfa8deea 100644
--- a/mm/mshare.c
+++ b/mm/mshare.c
@@ -15,19 +15,146 @@
#include <linux/fs.h>
#include <linux/fs_context.h>
+#include <linux/mman.h>
#include <uapi/linux/magic.h>
#include <linux/falloc.h>
const unsigned long mshare_align = P4D_SIZE;
+const unsigned long mshare_base = mshare_align;
#define MSHARE_INITIALIZED 0x1
struct mshare_data {
struct mm_struct *mm;
+ unsigned long start;
unsigned long size;
unsigned long flags;
};
+static int mshare_vm_op_split(struct vm_area_struct *vma, unsigned long addr)
+{
+ return -EINVAL;
+}
+
+static int mshare_vm_op_mprotect(struct vm_area_struct *vma, unsigned long start,
+ unsigned long end, unsigned long newflags)
+{
+ return -EINVAL;
+}
+
+static const struct vm_operations_struct msharefs_vm_ops = {
+ .may_split = mshare_vm_op_split,
+ .mprotect = mshare_vm_op_mprotect,
+};
+
+/*
+ * msharefs_mmap() - mmap an mshare region
+ */
+static int
+msharefs_mmap(struct file *file, struct vm_area_struct *vma)
+{
+ struct mshare_data *m_data = file->private_data;
+
+ vma->vm_private_data = m_data;
+ vm_flags_set(vma, VM_MSHARE | VM_DONTEXPAND);
+ vma->vm_ops = &msharefs_vm_ops;
+
+ return 0;
+}
+
+static unsigned long
+msharefs_get_unmapped_area_bottomup(struct file *file, unsigned long addr,
+ unsigned long len, unsigned long pgoff, unsigned long flags)
+{
+ struct vm_unmapped_area_info info = {};
+
+ info.length = len;
+ info.low_limit = current->mm->mmap_base;
+ info.high_limit = arch_get_mmap_end(addr, len, flags);
+ info.align_mask = PAGE_MASK & (mshare_align - 1);
+ return vm_unmapped_area(&info);
+}
+
+static unsigned long
+msharefs_get_unmapped_area_topdown(struct file *file, unsigned long addr,
+ unsigned long len, unsigned long pgoff, unsigned long flags)
+{
+ struct vm_unmapped_area_info info = {};
+
+ info.flags = VM_UNMAPPED_AREA_TOPDOWN;
+ info.length = len;
+ info.low_limit = PAGE_SIZE;
+ info.high_limit = arch_get_mmap_base(addr, current->mm->mmap_base);
+ info.align_mask = PAGE_MASK & (mshare_align - 1);
+ addr = vm_unmapped_area(&info);
+
+ /*
+ * A failed mmap() very likely causes application failure,
+ * so fall back to the bottom-up function here. This scenario
+ * can happen with large stack limits and large mmap()
+ * allocations.
+ */
+ if (unlikely(offset_in_page(addr))) {
+ VM_BUG_ON(addr != -ENOMEM);
+ info.flags = 0;
+ info.low_limit = current->mm->mmap_base;
+ info.high_limit = arch_get_mmap_end(addr, len, flags);
+ addr = vm_unmapped_area(&info);
+ }
+
+ return addr;
+}
+
+static unsigned long
+msharefs_get_unmapped_area(struct file *file, unsigned long addr,
+ unsigned long len, unsigned long pgoff, unsigned long flags)
+{
+ struct mshare_data *m_data = file->private_data;
+ struct mm_struct *mm = current->mm;
+ struct vm_area_struct *vma, *prev;
+ unsigned long mshare_start, mshare_size;
+ const unsigned long mmap_end = arch_get_mmap_end(addr, len, flags);
+
+ mmap_assert_write_locked(mm);
+
+ if ((flags & MAP_TYPE) == MAP_PRIVATE)
+ return -EINVAL;
+
+ if (!test_bit(MSHARE_INITIALIZED, &m_data->flags))
+ return -EINVAL;
+
+ mshare_start = m_data->start;
+ mshare_size = m_data->size;
+
+ if (len != mshare_size)
+ return -EINVAL;
+
+ if (len > mmap_end - mmap_min_addr)
+ return -ENOMEM;
+
+ if (flags & MAP_FIXED) {
+ if (!IS_ALIGNED(addr, mshare_align))
+ return -EINVAL;
+ return addr;
+ }
+
+ if (addr) {
+ addr = ALIGN(addr, mshare_align);
+ vma = find_vma_prev(mm, addr, &prev);
+ if (mmap_end - len >= addr && addr >= mmap_min_addr &&
+ (!vma || addr + len <= vm_start_gap(vma)) &&
+ (!prev || addr >= vm_end_gap(prev)))
+ return addr;
+ }
+
+ if (!test_bit(MMF_TOPDOWN, &mm->flags))
+ return msharefs_get_unmapped_area_bottomup(file, addr, len,
+ pgoff, flags);
+ else
+ return msharefs_get_unmapped_area_topdown(file, addr, len,
+ pgoff, flags);
+}
+
static int msharefs_set_size(struct mshare_data *m_data, unsigned long size)
{
int error = -EINVAL;
@@ -81,6 +208,8 @@ static const struct inode_operations msharefs_file_inode_ops;
static const struct file_operations msharefs_file_operations = {
.open = simple_open,
+ .mmap = msharefs_mmap,
+ .get_unmapped_area = msharefs_get_unmapped_area,
.fallocate = msharefs_fallocate,
};
@@ -97,7 +226,8 @@ msharefs_fill_mm(struct inode *inode)
goto err_free;
}
- mm->mmap_base = mm->task_size = 0;
+ mm->mmap_base = mshare_base;
+ mm->task_size = 0;
m_data = kzalloc(sizeof(*m_data), GFP_KERNEL);
if (!m_data) {
@@ -105,6 +235,7 @@ msharefs_fill_mm(struct inode *inode)
goto err_free;
}
m_data->mm = mm;
+ m_data->start = mshare_base;
inode->i_private = m_data;
return 0;
--
2.43.5