From: Liam Howlett <liam.howlett@oracle.com>
To: "maple-tree@lists.infradead.org" <maple-tree@lists.infradead.org>,
"linux-mm@kvack.org" <linux-mm@kvack.org>,
"linux-kernel@vger.kernel.org" <linux-kernel@vger.kernel.org>,
Andrew Morton <akpm@linux-foundation.org>
Cc: "Matthew Wilcox (Oracle)" <willy@infradead.org>,
Yang Yingliang <yangyingliang@huawei.com>,
Liam Howlett <liam.howlett@oracle.com>,
Vlastimil Babka <vbabka@suse.cz>
Subject: [PATCH v14 65/70] nommu: remove uses of VMA linked list
Date: Tue, 6 Sep 2022 19:49:05 +0000 [thread overview]
Message-ID: <20220906194824.2110408-66-Liam.Howlett@oracle.com> (raw)
In-Reply-To: <20220906194824.2110408-1-Liam.Howlett@oracle.com>
From: "Matthew Wilcox (Oracle)" <willy@infradead.org>
Use the maple tree or VMA iterator instead. This is faster and will allow
us to shrink the VMA.
Signed-off-by: Matthew Wilcox (Oracle) <willy@infradead.org>
Signed-off-by: Liam R. Howlett <Liam.Howlett@Oracle.com>
Acked-by: Vlastimil Babka <vbabka@suse.cz>
---
mm/nommu.c | 146 +++++++++++++++++++++++++++++++++++++++--------------
1 file changed, 109 insertions(+), 37 deletions(-)
diff --git a/mm/nommu.c b/mm/nommu.c
index 265a444a2cc2..269df51e9226 100644
--- a/mm/nommu.c
+++ b/mm/nommu.c
@@ -557,26 +557,14 @@ void vma_mas_remove(struct vm_area_struct *vma, struct ma_state *mas)
mas_store_prealloc(mas, NULL);
}
-/*
- * add a VMA into a process's mm_struct in the appropriate place in the list
- * and tree and add to the address space's page tree also if not an anonymous
- * page
- * - should be called with mm->mmap_lock held writelocked
- */
-static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
+static void setup_vma_to_mm(struct vm_area_struct *vma, struct mm_struct *mm)
{
- struct address_space *mapping;
- struct vm_area_struct *prev;
- MA_STATE(mas, &mm->mm_mt, vma->vm_start, vma->vm_end);
-
- BUG_ON(!vma->vm_region);
-
mm->map_count++;
vma->vm_mm = mm;
/* add the VMA to the mapping */
if (vma->vm_file) {
- mapping = vma->vm_file->f_mapping;
+ struct address_space *mapping = vma->vm_file->f_mapping;
i_mmap_lock_write(mapping);
flush_dcache_mmap_lock(mapping);
@@ -584,21 +572,52 @@ static void add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
flush_dcache_mmap_unlock(mapping);
i_mmap_unlock_write(mapping);
}
+}
- prev = mas_prev(&mas, 0);
- mas_reset(&mas);
+/*
+ * mas_add_vma_to_mm() - Maple state variant of add_vma_to_mm().
+ * @mas: The maple state with preallocations.
+ * @mm: The mm_struct
+ * @vma: The vma to add
+ *
+ */
+static void mas_add_vma_to_mm(struct ma_state *mas, struct mm_struct *mm,
+ struct vm_area_struct *vma)
+{
+ struct vm_area_struct *prev;
+
+ BUG_ON(!vma->vm_region);
+
+ setup_vma_to_mm(vma, mm);
+
+ prev = mas_prev(mas, 0);
+ mas_reset(mas);
/* add the VMA to the tree */
- vma_mas_store(vma, &mas);
+ vma_mas_store(vma, mas);
__vma_link_list(mm, vma, prev);
}
/*
- * delete a VMA from its owning mm_struct and address space
+ * add a VMA into a process's mm_struct in the appropriate place in the list
+ * and tree and add to the address space's page tree also if not an anonymous
+ * page
+ * - should be called with mm->mmap_lock held writelocked
*/
-static void delete_vma_from_mm(struct vm_area_struct *vma)
+static int add_vma_to_mm(struct mm_struct *mm, struct vm_area_struct *vma)
{
- MA_STATE(mas, &vma->vm_mm->mm_mt, 0, 0);
+ MA_STATE(mas, &mm->mm_mt, vma->vm_start, vma->vm_end);
+
+ if (mas_preallocate(&mas, vma, GFP_KERNEL)) {
+ pr_warn("Allocation of vma tree for process %d failed\n",
+ current->pid);
+ return -ENOMEM;
+ }
+ mas_add_vma_to_mm(&mas, mm, vma);
+ return 0;
+}
+static void cleanup_vma_from_mm(struct vm_area_struct *vma)
+{
vma->vm_mm->map_count--;
/* remove the VMA from the mapping */
if (vma->vm_file) {
@@ -611,10 +630,25 @@ static void delete_vma_from_mm(struct vm_area_struct *vma)
flush_dcache_mmap_unlock(mapping);
i_mmap_unlock_write(mapping);
}
+}
+/*
+ * delete a VMA from its owning mm_struct and address space
+ */
+static int delete_vma_from_mm(struct vm_area_struct *vma)
+{
+ MA_STATE(mas, &vma->vm_mm->mm_mt, 0, 0);
+
+ if (mas_preallocate(&mas, vma, GFP_KERNEL)) {
+ pr_warn("Allocation of vma tree for process %d failed\n",
+ current->pid);
+ return -ENOMEM;
+ }
+ cleanup_vma_from_mm(vma);
/* remove from the MM's tree and list */
vma_mas_remove(vma, &mas);
__vma_unlink_list(vma->vm_mm, vma);
+ return 0;
}
/*
@@ -1024,6 +1058,7 @@ unsigned long do_mmap(struct file *file,
vm_flags_t vm_flags;
unsigned long capabilities, result;
int ret;
+ MA_STATE(mas, &current->mm->mm_mt, 0, 0);
*populate = 0;
@@ -1042,6 +1077,7 @@ unsigned long do_mmap(struct file *file,
* now know into VMA flags */
vm_flags = determine_vm_flags(file, prot, flags, capabilities);
+
/* we're going to need to record the mapping */
region = kmem_cache_zalloc(vm_region_jar, GFP_KERNEL);
if (!region)
@@ -1051,6 +1087,9 @@ unsigned long do_mmap(struct file *file,
if (!vma)
goto error_getting_vma;
+ if (mas_preallocate(&mas, vma, GFP_KERNEL))
+ goto error_maple_preallocate;
+
region->vm_usage = 1;
region->vm_flags = vm_flags;
region->vm_pgoff = pgoff;
@@ -1191,7 +1230,7 @@ unsigned long do_mmap(struct file *file,
current->mm->total_vm += len >> PAGE_SHIFT;
share:
- add_vma_to_mm(current->mm, vma);
+ mas_add_vma_to_mm(&mas, current->mm, vma);
/* we flush the region from the icache only when the first executable
* mapping of it is made */
@@ -1217,6 +1256,7 @@ unsigned long do_mmap(struct file *file,
sharing_violation:
up_write(&nommu_region_sem);
+ mas_destroy(&mas);
pr_warn("Attempt to share mismatched mappings\n");
ret = -EINVAL;
goto error;
@@ -1233,6 +1273,14 @@ unsigned long do_mmap(struct file *file,
len, current->pid);
show_free_areas(0, NULL);
return -ENOMEM;
+
+error_maple_preallocate:
+ kmem_cache_free(vm_region_jar, region);
+ vm_area_free(vma);
+ pr_warn("Allocation of vma tree for process %d failed\n", current->pid);
+ show_free_areas(0, NULL);
+ return -ENOMEM;
+
}
unsigned long ksys_mmap_pgoff(unsigned long addr, unsigned long len,
@@ -1298,6 +1346,7 @@ int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
struct vm_area_struct *new;
struct vm_region *region;
unsigned long npages;
+ MA_STATE(mas, &mm->mm_mt, vma->vm_start, vma->vm_end);
/* we're only permitted to split anonymous regions (these should have
* only a single usage on the region) */
@@ -1312,9 +1361,13 @@ int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
return -ENOMEM;
new = vm_area_dup(vma);
- if (!new) {
- kmem_cache_free(vm_region_jar, region);
- return -ENOMEM;
+ if (!new)
+ goto err_vma_dup;
+
+ if (mas_preallocate(&mas, vma, GFP_KERNEL)) {
+ pr_warn("Allocation of vma tree for process %d failed\n",
+ current->pid);
+ goto err_mas_preallocate;
}
/* most fields are the same, copy all, and then fixup */
@@ -1333,7 +1386,6 @@ int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
if (new->vm_ops && new->vm_ops->open)
new->vm_ops->open(new);
- delete_vma_from_mm(vma);
down_write(&nommu_region_sem);
delete_nommu_region(vma->vm_region);
if (new_below) {
@@ -1346,9 +1398,19 @@ int split_vma(struct mm_struct *mm, struct vm_area_struct *vma,
add_nommu_region(vma->vm_region);
add_nommu_region(new->vm_region);
up_write(&nommu_region_sem);
- add_vma_to_mm(mm, vma);
- add_vma_to_mm(mm, new);
+
+ setup_vma_to_mm(vma, mm);
+ setup_vma_to_mm(new, mm);
+ mas_set_range(&mas, vma->vm_start, vma->vm_end - 1);
+ mas_store(&mas, vma);
+ vma_mas_store(new, &mas);
return 0;
+
+err_mas_preallocate:
+ vm_area_free(new);
+err_vma_dup:
+ kmem_cache_free(vm_region_jar, region);
+ return -ENOMEM;
}
/*
@@ -1363,12 +1425,14 @@ static int shrink_vma(struct mm_struct *mm,
/* adjust the VMA's pointers, which may reposition it in the MM's tree
* and list */
- delete_vma_from_mm(vma);
+ if (delete_vma_from_mm(vma))
+ return -ENOMEM;
if (from > vma->vm_start)
vma->vm_end = from;
else
vma->vm_start = to;
- add_vma_to_mm(mm, vma);
+ if (add_vma_to_mm(mm, vma))
+ return -ENOMEM;
/* cut the backing region down to size */
region = vma->vm_region;
@@ -1396,9 +1460,10 @@ static int shrink_vma(struct mm_struct *mm,
*/
int do_munmap(struct mm_struct *mm, unsigned long start, size_t len, struct list_head *uf)
{
+ MA_STATE(mas, &mm->mm_mt, start, start);
struct vm_area_struct *vma;
unsigned long end;
- int ret;
+ int ret = 0;
len = PAGE_ALIGN(len);
if (len == 0)
@@ -1407,7 +1472,7 @@ int do_munmap(struct mm_struct *mm, unsigned long start, size_t len, struct list
end = start + len;
/* find the first potentially overlapping VMA */
- vma = find_vma(mm, start);
+ vma = mas_find(&mas, end - 1);
if (!vma) {
static int limit;
if (limit < 5) {
@@ -1426,7 +1491,7 @@ int do_munmap(struct mm_struct *mm, unsigned long start, size_t len, struct list
return -EINVAL;
if (end == vma->vm_end)
goto erase_whole_vma;
- vma = vma->vm_next;
+ vma = mas_next(&mas, end - 1);
} while (vma);
return -EINVAL;
} else {
@@ -1448,9 +1513,10 @@ int do_munmap(struct mm_struct *mm, unsigned long start, size_t len, struct list
}
erase_whole_vma:
- delete_vma_from_mm(vma);
+ if (delete_vma_from_mm(vma))
+ ret = -ENOMEM;
delete_vma(mm, vma);
- return 0;
+ return ret;
}
int vm_munmap(unsigned long addr, size_t len)
@@ -1475,6 +1541,7 @@ SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len)
*/
void exit_mmap(struct mm_struct *mm)
{
+ VMA_ITERATOR(vmi, mm, 0);
struct vm_area_struct *vma;
if (!mm)
@@ -1482,13 +1549,18 @@ void exit_mmap(struct mm_struct *mm)
mm->total_vm = 0;
- while ((vma = mm->mmap)) {
- mm->mmap = vma->vm_next;
- delete_vma_from_mm(vma);
+ /*
+ * Lock the mm to avoid assert complaining even though this is the only
+ * user of the mm
+ */
+ mmap_write_lock(mm);
+ for_each_vma(vmi, vma) {
+ cleanup_vma_from_mm(vma);
delete_vma(mm, vma);
cond_resched();
}
__mt_destroy(&mm->mm_mt);
+ mmap_write_unlock(mm);
}
int vm_brk(unsigned long addr, unsigned long len)
--
2.35.1
next prev parent reply other threads:[~2022-09-06 19:50 UTC|newest]
Thread overview: 89+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-09-06 19:48 [PATCH v14 00/70] Introducing the Maple Tree Liam Howlett
2022-09-06 19:48 ` [PATCH v14 02/70] radix tree test suite: add pr_err define Liam Howlett
2022-09-06 19:48 ` [PATCH v14 01/70] Maple Tree: add new data structure Liam Howlett
2022-09-12 8:42 ` Bagas Sanjaya
2022-09-14 10:16 ` Liam Howlett
2022-09-06 19:48 ` [PATCH v14 04/70] radix tree test suite: add allocation counts and size to kmem_cache Liam Howlett
2022-09-06 19:48 ` [PATCH v14 03/70] radix tree test suite: add kmem_cache_set_non_kernel() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 05/70] radix tree test suite: add support for slab bulk APIs Liam Howlett
2022-09-06 19:48 ` [PATCH v14 06/70] radix tree test suite: add lockdep_is_held to header Liam Howlett
2022-09-06 19:48 ` [PATCH v14 07/70] lib/test_maple_tree: add testing for maple tree Liam Howlett
2022-10-11 12:16 ` Geert Uytterhoeven
2022-10-11 12:56 ` Matthew Wilcox
2022-10-11 12:59 ` Geert Uytterhoeven
2022-10-11 16:13 ` Liam Howlett
2022-09-06 19:48 ` [PATCH v14 08/70] mm: start tracking VMAs with " Liam Howlett
2022-09-06 19:48 ` [PATCH v14 11/70] mm/mmap: use the maple tree in find_vma() instead of the rbtree Liam Howlett
2022-09-06 19:48 ` [PATCH v14 10/70] mmap: use the VMA iterator in count_vma_pages_range() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 09/70] mm: add VMA iterator Liam Howlett
2022-09-06 19:48 ` [PATCH v14 14/70] kernel/fork: use maple tree for dup_mmap() during forking Liam Howlett
2022-09-06 19:48 ` [PATCH v14 12/70] mm/mmap: use the maple tree for find_vma_prev() instead of the rbtree Liam Howlett
2022-09-06 19:48 ` [PATCH v14 13/70] mm/mmap: use maple tree for unmapped_area{_topdown} Liam Howlett
2022-09-06 19:48 ` [PATCH v14 17/70] mm: remove rb tree Liam Howlett
2022-09-06 19:48 ` [PATCH v14 16/70] proc: remove VMA rbtree use from nommu Liam Howlett
2022-09-06 19:48 ` [PATCH v14 15/70] damon: convert __damon_va_three_regions to use the VMA iterator Liam Howlett
2022-09-06 19:48 ` [PATCH v14 20/70] mm: optimize find_exact_vma() to use vma_lookup() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 18/70] mmap: change zeroing of maple tree in __vma_adjust() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 19/70] xen: use vma_lookup() in privcmd_ioctl_mmap() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 22/70] mm/mmap: change do_brk_flags() to expand existing VMA and add do_brk_munmap() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 21/70] mm/khugepaged: optimize collapse_pte_mapped_thp() by using vma_lookup() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 23/70] mm: use maple tree operations for find_vma_intersection() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 24/70] mm/mmap: use advanced maple tree API for mmap_region() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 25/70] mm: remove vmacache Liam Howlett
2022-09-06 19:48 ` [PATCH v14 26/70] mm: convert vma_lookup() to use mtree_load() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 28/70] mm/mmap: reorganize munmap to use maple states Liam Howlett
2022-09-06 19:48 ` [PATCH v14 27/70] mm/mmap: move mmap_region() below do_munmap() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 29/70] mm/mmap: change do_brk_munmap() to use do_mas_align_munmap() Liam Howlett
2022-09-06 19:48 ` [PATCH v14 30/70] arm64: remove mmap linked list from vdso Liam Howlett
2022-09-06 19:48 ` [PATCH v14 31/70] arm64: Change elfcore for_each_mte_vma() to use VMA iterator Liam Howlett
2022-09-06 19:48 ` [PATCH v14 32/70] parisc: remove mmap linked list from cache handling Liam Howlett
2022-09-06 19:48 ` [PATCH v14 33/70] powerpc: remove mmap linked list walks Liam Howlett
2022-09-06 19:48 ` [PATCH v14 34/70] s390: remove vma " Liam Howlett
2022-09-06 19:48 ` [PATCH v14 35/70] x86: " Liam Howlett
2022-09-06 19:48 ` [PATCH v14 38/70] optee: remove vma linked list walk Liam Howlett
2022-09-06 19:48 ` [PATCH v14 36/70] xtensa: remove vma linked list walks Liam Howlett
2022-09-06 19:48 ` [PATCH v14 37/70] cxl: remove vma linked list walk Liam Howlett
2022-09-06 19:48 ` [PATCH v14 39/70] um: " Liam Howlett
2022-09-06 19:48 ` [PATCH v14 41/70] exec: use VMA iterator instead of linked list Liam Howlett
2022-09-06 19:48 ` [PATCH v14 40/70] coredump: remove vma linked list walk Liam Howlett
2022-09-06 19:48 ` [PATCH v14 42/70] fs/proc/base: use the vma iterators in place of linked list Liam Howlett
2022-09-06 19:48 ` [PATCH v14 43/70] fs/proc/task_mmu: stop using linked list and highest_vm_end Liam Howlett
2022-09-06 19:48 ` [PATCH v14 44/70] userfaultfd: use maple tree iterator to iterate VMAs Liam Howlett
2022-09-06 19:48 ` [PATCH v14 45/70] ipc/shm: use VMA iterator instead of linked list Liam Howlett
2022-09-06 19:48 ` [PATCH v14 46/70] acct: " Liam Howlett
2022-09-06 19:48 ` [PATCH v14 47/70] perf: use VMA iterator Liam Howlett
2022-09-06 19:48 ` [PATCH v14 50/70] bpf: remove VMA linked list Liam Howlett
2022-09-06 19:48 ` [PATCH v14 49/70] fork: use VMA iterator Liam Howlett
2022-09-06 19:48 ` [PATCH v14 48/70] sched: use maple tree iterator to walk VMAs Liam Howlett
2022-09-06 19:49 ` [PATCH v14 52/70] mm/khugepaged: stop using vma linked list Liam Howlett
2022-09-06 19:49 ` [PATCH v14 51/70] mm/gup: use maple tree navigation instead of " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 55/70] mm/memcontrol: stop using mm->highest_vm_end Liam Howlett
2022-09-06 19:49 ` [PATCH v14 54/70] mm/madvise: use vma_find() instead of vma linked list Liam Howlett
2022-09-06 19:49 ` [PATCH v14 53/70] mm/ksm: use vma iterators " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 57/70] mm/mlock: use vma iterator and maple state " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 56/70] mm/mempolicy: use vma iterator & " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 58/70] mm/mprotect: use maple tree navigation instead of VMA " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 59/70] mm/mremap: use vma_find_intersection() instead of vma " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 60/70] mm/msync: use vma_find() " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 61/70] mm/oom_kill: use vma iterators " Liam Howlett
2022-09-06 19:49 ` [PATCH v14 64/70] i915: use the VMA iterator Liam Howlett
2022-09-06 19:49 ` [PATCH v14 63/70] mm/swapfile: use vma iterator instead of vma linked list Liam Howlett
2022-09-06 19:49 ` [PATCH v14 62/70] mm/pagewalk: use vma_find() " Liam Howlett
2022-09-06 19:49 ` Liam Howlett [this message]
2022-09-06 19:49 ` [PATCH v14 67/70] mm/vmscan: Use vma iterator instead of vm_next Liam Howlett
2022-09-12 6:55 ` Yu Zhao
2022-09-12 7:13 ` Yu Zhao
2022-09-12 7:14 ` Liam Howlett
2022-09-12 19:45 ` Andrew Morton
2022-09-12 20:01 ` Yu Zhao
2022-09-12 21:03 ` Andrew Morton
2022-09-13 3:39 ` Yu Zhao
2022-09-06 19:49 ` [PATCH v14 66/70] riscv: use vma iterator for vdso Liam Howlett
2022-09-06 19:49 ` [PATCH v14 70/70] mm/mmap.c: pass in mapping to __vma_link_file() Liam Howlett
2022-09-06 19:49 ` [PATCH v14 68/70] mm: remove the vma linked list Liam Howlett
2022-09-06 19:49 ` [PATCH v14 69/70] mm/mmap: drop range_has_overlap() function Liam Howlett
2022-09-06 23:51 ` [PATCH v14 00/70] Introducing the Maple Tree Andrew Morton
2022-09-07 0:24 ` Liam Howlett
2022-09-12 0:20 ` Andrew Morton
2022-09-15 18:03 ` Yu Zhao
2022-09-17 8:24 ` Yu Zhao
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20220906194824.2110408-66-Liam.Howlett@oracle.com \
--to=liam.howlett@oracle.com \
--cc=akpm@linux-foundation.org \
--cc=linux-kernel@vger.kernel.org \
--cc=linux-mm@kvack.org \
--cc=maple-tree@lists.infradead.org \
--cc=vbabka@suse.cz \
--cc=willy@infradead.org \
--cc=yangyingliang@huawei.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).