commit 5e31275cc9 ("mm: introduce per-VMA lock implementation")
Introduce per-VMA locking.  The lock implementation relies on per-vma
and per-mm sequence counters to note exclusive locking (a simplified
sketch of these primitives follows the message):
  - read lock - (implemented by vma_start_read) requires the vma
    (vm_lock_seq) and mm (mm_lock_seq) sequence counters to differ.
    If they match, then a vma exclusive lock must be held somewhere.
  - read unlock - (implemented by vma_end_read) is a trivial vma->lock
    unlock.
  - write lock - (vma_start_write) requires the mmap_lock to be held
    exclusively; the current mm counter is then assigned to the vma
    counter. This allows multiple vmas to be locked under a single
    mmap_lock write lock (e.g. during vma merging). The vma counter is
    modified under the exclusive vma lock.
  - write unlock - (vma_end_write_all) is a batch release of all vma
    locks held. It doesn't pair with a specific vma_start_write! It is
    done before the exclusive mmap_lock is released, by incrementing the
    mm sequence counter (mm_lock_seq).
  - write downgrade - if the mmap_lock is downgraded to a read lock, all
    vma write locks are released as well (effectively the same as write
    unlock).
Link: https://lkml.kernel.org/r/20230227173632.3292573-13-surenb@google.com
Signed-off-by: Suren Baghdasaryan <surenb@google.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
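
The list above maps onto a small set of helpers. Below is a minimal
sketch of how they can be built from the two sequence counters and the
per-vma lock; in this series the real helpers live in include/linux/mm.h,
so the code here is a simplified illustration of the scheme, not the
verbatim patch:

/* Simplified sketch of the counter scheme described above; not verbatim. */
static inline bool vma_start_read(struct vm_area_struct *vma)
{
	/* Equal counters mean a writer holds this vma: bail out early. */
	if (vma->vm_lock_seq == READ_ONCE(vma->vm_mm->mm_lock_seq))
		return false;

	if (unlikely(down_read_trylock(&vma->lock) == 0))
		return false;

	/* Re-check under vma->lock: a writer may have locked it meanwhile. */
	if (unlikely(vma->vm_lock_seq == READ_ONCE(vma->vm_mm->mm_lock_seq))) {
		up_read(&vma->lock);
		return false;
	}
	return true;
}

static inline void vma_end_read(struct vm_area_struct *vma)
{
	up_read(&vma->lock);		/* the trivial unlock noted above */
}

static inline void vma_start_write(struct vm_area_struct *vma)
{
	int mm_lock_seq;

	mmap_assert_write_locked(vma->vm_mm);	/* writers hold mmap_lock */

	mm_lock_seq = READ_ONCE(vma->vm_mm->mm_lock_seq);
	if (vma->vm_lock_seq == mm_lock_seq)
		return;			/* already write-locked this cycle */

	/* Make the counters match, under vma->lock to exclude readers. */
	down_write(&vma->lock);
	vma->vm_lock_seq = mm_lock_seq;
	up_write(&vma->lock);
}

Note there is deliberately no per-vma write unlock: vma_end_write_all()
in the header below invalidates every vma write lock at once by bumping
mm_lock_seq so that the counters no longer match.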
include/linux/mmap_lock.h · 183 lines · 4.6 KiB · C
#ifndef _LINUX_MMAP_LOCK_H
#define _LINUX_MMAP_LOCK_H

#include <linux/lockdep.h>
#include <linux/mm_types.h>
#include <linux/mmdebug.h>
#include <linux/rwsem.h>
#include <linux/tracepoint-defs.h>
#include <linux/types.h>

#define MMAP_LOCK_INITIALIZER(name) \
	.mmap_lock = __RWSEM_INITIALIZER((name).mmap_lock),

DECLARE_TRACEPOINT(mmap_lock_start_locking);
DECLARE_TRACEPOINT(mmap_lock_acquire_returned);
DECLARE_TRACEPOINT(mmap_lock_released);

#ifdef CONFIG_TRACING

void __mmap_lock_do_trace_start_locking(struct mm_struct *mm, bool write);
void __mmap_lock_do_trace_acquire_returned(struct mm_struct *mm, bool write,
					   bool success);
void __mmap_lock_do_trace_released(struct mm_struct *mm, bool write);

static inline void __mmap_lock_trace_start_locking(struct mm_struct *mm,
						   bool write)
{
	if (tracepoint_enabled(mmap_lock_start_locking))
		__mmap_lock_do_trace_start_locking(mm, write);
}

static inline void __mmap_lock_trace_acquire_returned(struct mm_struct *mm,
						      bool write, bool success)
{
	if (tracepoint_enabled(mmap_lock_acquire_returned))
		__mmap_lock_do_trace_acquire_returned(mm, write, success);
}

static inline void __mmap_lock_trace_released(struct mm_struct *mm, bool write)
{
	if (tracepoint_enabled(mmap_lock_released))
		__mmap_lock_do_trace_released(mm, write);
}

#else /* !CONFIG_TRACING */

static inline void __mmap_lock_trace_start_locking(struct mm_struct *mm,
						   bool write)
{
}

static inline void __mmap_lock_trace_acquire_returned(struct mm_struct *mm,
						      bool write, bool success)
{
}

static inline void __mmap_lock_trace_released(struct mm_struct *mm, bool write)
{
}

#endif /* CONFIG_TRACING */

static inline void mmap_assert_locked(struct mm_struct *mm)
{
	lockdep_assert_held(&mm->mmap_lock);
	VM_BUG_ON_MM(!rwsem_is_locked(&mm->mmap_lock), mm);
}

static inline void mmap_assert_write_locked(struct mm_struct *mm)
{
	lockdep_assert_held_write(&mm->mmap_lock);
	VM_BUG_ON_MM(!rwsem_is_locked(&mm->mmap_lock), mm);
}

#ifdef CONFIG_PER_VMA_LOCK
static inline void vma_end_write_all(struct mm_struct *mm)
{
	mmap_assert_write_locked(mm);
	/* No races during update due to exclusive mmap_lock being held */
	WRITE_ONCE(mm->mm_lock_seq, mm->mm_lock_seq + 1);
}
#else
static inline void vma_end_write_all(struct mm_struct *mm) {}
#endif

static inline void mmap_init_lock(struct mm_struct *mm)
{
	init_rwsem(&mm->mmap_lock);
}

static inline void mmap_write_lock(struct mm_struct *mm)
{
	__mmap_lock_trace_start_locking(mm, true);
	down_write(&mm->mmap_lock);
	__mmap_lock_trace_acquire_returned(mm, true, true);
}

static inline void mmap_write_lock_nested(struct mm_struct *mm, int subclass)
{
	__mmap_lock_trace_start_locking(mm, true);
	down_write_nested(&mm->mmap_lock, subclass);
	__mmap_lock_trace_acquire_returned(mm, true, true);
}

static inline int mmap_write_lock_killable(struct mm_struct *mm)
{
	int ret;

	__mmap_lock_trace_start_locking(mm, true);
	ret = down_write_killable(&mm->mmap_lock);
	__mmap_lock_trace_acquire_returned(mm, true, ret == 0);
	return ret;
}

static inline bool mmap_write_trylock(struct mm_struct *mm)
{
	bool ret;

	__mmap_lock_trace_start_locking(mm, true);
	ret = down_write_trylock(&mm->mmap_lock) != 0;
	__mmap_lock_trace_acquire_returned(mm, true, ret);
	return ret;
}

static inline void mmap_write_unlock(struct mm_struct *mm)
{
	__mmap_lock_trace_released(mm, true);
	vma_end_write_all(mm);
	up_write(&mm->mmap_lock);
}

static inline void mmap_write_downgrade(struct mm_struct *mm)
{
	__mmap_lock_trace_acquire_returned(mm, false, true);
	vma_end_write_all(mm);
	downgrade_write(&mm->mmap_lock);
}

static inline void mmap_read_lock(struct mm_struct *mm)
{
	__mmap_lock_trace_start_locking(mm, false);
	down_read(&mm->mmap_lock);
	__mmap_lock_trace_acquire_returned(mm, false, true);
}

static inline int mmap_read_lock_killable(struct mm_struct *mm)
{
	int ret;

	__mmap_lock_trace_start_locking(mm, false);
	ret = down_read_killable(&mm->mmap_lock);
	__mmap_lock_trace_acquire_returned(mm, false, ret == 0);
	return ret;
}

static inline bool mmap_read_trylock(struct mm_struct *mm)
{
	bool ret;

	__mmap_lock_trace_start_locking(mm, false);
	ret = down_read_trylock(&mm->mmap_lock) != 0;
	__mmap_lock_trace_acquire_returned(mm, false, ret);
	return ret;
}

static inline void mmap_read_unlock(struct mm_struct *mm)
{
	__mmap_lock_trace_released(mm, false);
	up_read(&mm->mmap_lock);
}

static inline void mmap_read_unlock_non_owner(struct mm_struct *mm)
{
	__mmap_lock_trace_released(mm, false);
	up_read_non_owner(&mm->mmap_lock);
}

static inline int mmap_lock_is_contended(struct mm_struct *mm)
{
	return rwsem_is_contended(&mm->mmap_lock);
}

#endif /* _LINUX_MMAP_LOCK_H */
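
As a usage illustration (hypothetical caller; the names below are not
from this patch): a reader tries the per-VMA lock first and falls back
when that fails, while a writer takes the mmap_lock write side and
relies on mmap_write_unlock() calling vma_end_write_all() to release
every vma write lock in a single mm_lock_seq increment:

/* Hypothetical usage sketch; do_fault_locked() is an illustrative helper. */
static vm_fault_t fault_with_vma_lock(struct vm_area_struct *vma,
				      unsigned long addr)
{
	vm_fault_t ret;

	if (!vma_start_read(vma))
		return VM_FAULT_RETRY;	/* fall back to the mmap_read_lock() path */

	ret = do_fault_locked(vma, addr);
	vma_end_read(vma);
	return ret;
}

static void writer_path(struct mm_struct *mm, struct vm_area_struct *vma)
{
	mmap_write_lock(mm);
	vma_start_write(vma);	/* counters now match: readers are excluded */
	/* ... modify the vma ... */
	mmap_write_unlock(mm);	/* vma_end_write_all() drops all vma write locks */
}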