mm: unconditionally close VMAs on error

Invoking VMA callbacks when the VMA is no longer in a consistent state is
bug-prone and risky.

With regard to the important vm_ops->close() callback, we have gone to
great lengths to try to track whether or not we ought to close VMAs.

Rather than doing so and risking making a mistake somewhere, instead
unconditionally close and reset vma->vm_ops to an empty dummy operations
set with a NULL .close operator.

We introduce a new function to do so - vma_close() - and simplify existing
vms logic which tracked whether we needed to close or not.

This simplifies the logic, avoids incorrect double-calling of the .close()
callback and allows us to update error paths to simply call vma_close()
unconditionally - making VMA closure idempotent.

Link: https://lkml.kernel.org/r/28e89dda96f68c505cb6f8e9fc9b57c3e9f74b42.1730224667.git.lorenzo.stoakes@oracle.com
Fixes: deb0f65628 ("mm/mmap: undo ->mmap() when arch_validate_flags() fails")
Signed-off-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Reported-by: Jann Horn <jannh@google.com>
Reviewed-by: Vlastimil Babka <vbabka@suse.cz>
Reviewed-by: Liam R. Howlett <Liam.Howlett@oracle.com>
Reviewed-by: Jann Horn <jannh@google.com>
Cc: Andreas Larsson <andreas@gaisler.com>
Cc: Catalin Marinas <catalin.marinas@arm.com>
Cc: David S. Miller <davem@davemloft.net>
Cc: Helge Deller <deller@gmx.de>
Cc: James E.J. Bottomley <James.Bottomley@HansenPartnership.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Mark Brown <broonie@kernel.org>
Cc: Peter Xu <peterx@redhat.com>
Cc: Will Deacon <will@kernel.org>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
This commit is contained in:
Lorenzo Stoakes 2024-10-29 18:11:45 +00:00 committed by Andrew Morton
parent 3dd6ed34ce
commit 4080ef1579
5 changed files with 27 additions and 17 deletions

View File

@ -135,6 +135,24 @@ static inline int mmap_file(struct file *file, struct vm_area_struct *vma)
return err; return err;
} }
/*
 * Run the VMA's ->close() hook when one is installed, then replace
 * vma->vm_ops with the dummy operations set. Closing may leave the mapping
 * in an inconsistent state, so its original hooks can no longer be trusted.
 *
 * VMAs with no vm_ops, or with no ->close() hook, are left untouched.
 */
static inline void vma_close(struct vm_area_struct *vma)
{
	/* Nothing to close: leave vm_ops exactly as they are. */
	if (!vma->vm_ops || !vma->vm_ops->close)
		return;

	vma->vm_ops->close(vma);

	/*
	 * From here on no further hooks may be invoked upon this mapping, so
	 * point it at the dummy ops.
	 */
	vma->vm_ops = &vma_dummy_vm_ops;
}
#ifdef CONFIG_MMU #ifdef CONFIG_MMU
/* Flags for folio_pte_batch(). */ /* Flags for folio_pte_batch(). */

View File

@ -1573,8 +1573,7 @@ expanded:
return addr; return addr;
close_and_free_vma: close_and_free_vma:
if (file && !vms.closed_vm_ops && vma->vm_ops && vma->vm_ops->close) vma_close(vma);
vma->vm_ops->close(vma);
if (file || vma->vm_file) { if (file || vma->vm_file) {
unmap_and_free_vma: unmap_and_free_vma:
@ -1934,7 +1933,7 @@ void exit_mmap(struct mm_struct *mm)
do { do {
if (vma->vm_flags & VM_ACCOUNT) if (vma->vm_flags & VM_ACCOUNT)
nr_accounted += vma_pages(vma); nr_accounted += vma_pages(vma);
remove_vma(vma, /* unreachable = */ true, /* closed = */ false); remove_vma(vma, /* unreachable = */ true);
count++; count++;
cond_resched(); cond_resched();
vma = vma_next(&vmi); vma = vma_next(&vmi);

View File

@ -589,8 +589,7 @@ static int delete_vma_from_mm(struct vm_area_struct *vma)
*/ */
static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma) static void delete_vma(struct mm_struct *mm, struct vm_area_struct *vma)
{ {
if (vma->vm_ops && vma->vm_ops->close) vma_close(vma);
vma->vm_ops->close(vma);
if (vma->vm_file) if (vma->vm_file)
fput(vma->vm_file); fput(vma->vm_file);
put_nommu_region(vma->vm_region); put_nommu_region(vma->vm_region);

View File

@ -323,11 +323,10 @@ static bool can_vma_merge_right(struct vma_merge_struct *vmg,
/* /*
* Close a vm structure and free it. * Close a vm structure and free it.
*/ */
void remove_vma(struct vm_area_struct *vma, bool unreachable, bool closed) void remove_vma(struct vm_area_struct *vma, bool unreachable)
{ {
might_sleep(); might_sleep();
if (!closed && vma->vm_ops && vma->vm_ops->close) vma_close(vma);
vma->vm_ops->close(vma);
if (vma->vm_file) if (vma->vm_file)
fput(vma->vm_file); fput(vma->vm_file);
mpol_put(vma_policy(vma)); mpol_put(vma_policy(vma));
@ -1115,9 +1114,7 @@ void vms_clean_up_area(struct vma_munmap_struct *vms,
vms_clear_ptes(vms, mas_detach, true); vms_clear_ptes(vms, mas_detach, true);
mas_set(mas_detach, 0); mas_set(mas_detach, 0);
mas_for_each(mas_detach, vma, ULONG_MAX) mas_for_each(mas_detach, vma, ULONG_MAX)
if (vma->vm_ops && vma->vm_ops->close) vma_close(vma);
vma->vm_ops->close(vma);
vms->closed_vm_ops = true;
} }
/* /*
@ -1160,7 +1157,7 @@ void vms_complete_munmap_vmas(struct vma_munmap_struct *vms,
/* Remove and clean up vmas */ /* Remove and clean up vmas */
mas_set(mas_detach, 0); mas_set(mas_detach, 0);
mas_for_each(mas_detach, vma, ULONG_MAX) mas_for_each(mas_detach, vma, ULONG_MAX)
remove_vma(vma, /* = */ false, vms->closed_vm_ops); remove_vma(vma, /* unreachable = */ false);
vm_unacct_memory(vms->nr_accounted); vm_unacct_memory(vms->nr_accounted);
validate_mm(mm); validate_mm(mm);
@ -1684,8 +1681,7 @@ struct vm_area_struct *copy_vma(struct vm_area_struct **vmap,
return new_vma; return new_vma;
out_vma_link: out_vma_link:
if (new_vma->vm_ops && new_vma->vm_ops->close) vma_close(new_vma);
new_vma->vm_ops->close(new_vma);
if (new_vma->vm_file) if (new_vma->vm_file)
fput(new_vma->vm_file); fput(new_vma->vm_file);

View File

@ -42,7 +42,6 @@ struct vma_munmap_struct {
int vma_count; /* Number of vmas that will be removed */ int vma_count; /* Number of vmas that will be removed */
bool unlock; /* Unlock after the munmap */ bool unlock; /* Unlock after the munmap */
bool clear_ptes; /* If there are outstanding PTE to be cleared */ bool clear_ptes; /* If there are outstanding PTE to be cleared */
bool closed_vm_ops; /* call_mmap() was encountered, so vmas may be closed */
/* 1 byte hole */ /* 1 byte hole */
unsigned long nr_pages; /* Number of pages being removed */ unsigned long nr_pages; /* Number of pages being removed */
unsigned long locked_vm; /* Number of locked pages */ unsigned long locked_vm; /* Number of locked pages */
@ -198,7 +197,6 @@ static inline void init_vma_munmap(struct vma_munmap_struct *vms,
vms->unmap_start = FIRST_USER_ADDRESS; vms->unmap_start = FIRST_USER_ADDRESS;
vms->unmap_end = USER_PGTABLES_CEILING; vms->unmap_end = USER_PGTABLES_CEILING;
vms->clear_ptes = false; vms->clear_ptes = false;
vms->closed_vm_ops = false;
} }
#endif #endif
@ -269,7 +267,7 @@ int do_vmi_munmap(struct vma_iterator *vmi, struct mm_struct *mm,
unsigned long start, size_t len, struct list_head *uf, unsigned long start, size_t len, struct list_head *uf,
bool unlock); bool unlock);
void remove_vma(struct vm_area_struct *vma, bool unreachable, bool closed); void remove_vma(struct vm_area_struct *vma, bool unreachable);
void unmap_region(struct ma_state *mas, struct vm_area_struct *vma, void unmap_region(struct ma_state *mas, struct vm_area_struct *vma,
struct vm_area_struct *prev, struct vm_area_struct *next); struct vm_area_struct *prev, struct vm_area_struct *next);