Unverified Commit 39622c1a authored by openeuler-ci-bot, committed by Gitee

!3059 Handle more faults under the VMA lock

Merge Pull Request from: @ci-robot 
 
PR sync from: Tong Tiangen <tongtiangen@huawei.com>
https://mailweb.openeuler.org/hyperkitty/list/kernel@openeuler.org/message/BOA4N5D5I6AZIOQV5BKTK4F2JBETTTR2/ 
At this point, we're handling the majority of file-backed page faults
under the VMA lock, using the ->map_pages entry point.  This patch set
attempts to expand that to the following situations (see the sketch
after this list):

 - We have to do a read.  This could be because we've hit the point in
   the readahead window where we need to kick off the next readahead,
   or because the page is simply not present in cache.
 - We're handling a write fault.  Most applications don't do I/O by
   writing to shared mmaps for very good reasons, but some do, and it'd
   be nice not to make that unnecessarily slow.
 - We're doing a COW of a private mapping (both with the PTE already
   present and with the PTE not present).  These are two different
   codepaths, and I handle both of them in this patch set.
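
To make the retry semantics concrete, here's a rough caller-side sketch
(modelled on x86's do_user_addr_fault(); accounting and error handling
are elided, so treat it as an approximation, not this patch set's code).
Whenever a handler below bails out with VM_FAULT_RETRY after releasing
the VMA lock, the arch code retries the fault under the mmap_lock:

	vma = lock_vma_under_rcu(mm, address);
	if (!vma)
		goto lock_mmap;

	fault = handle_mm_fault(vma, address, flags | FAULT_FLAG_VMA_LOCK, regs);
	/* The handler drops the VMA lock itself on RETRY/COMPLETED. */
	if (!(fault & (VM_FAULT_RETRY | VM_FAULT_COMPLETED)))
		vma_end_read(vma);
	if (!(fault & VM_FAULT_RETRY))
		goto done;	/* handled entirely under the VMA lock */

lock_mmap:
	mmap_read_lock(mm);
	/* ... traditional fully-locked fault path ... */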

There is no support in this patch set for drivers to mark themselves
as being VMA lock friendly; they could implement the ->map_pages
vm_operation, but if they do, they would be the first.  This is probably
something we want to change at some point in the future, and I've marked
where to make that change in the code.
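
For illustration only, such an opt-in could look like the sketch below;
the mydrv_* names are hypothetical, and the signal is simply the
presence of ->map_pages, which is what vmf_can_call_fault() in the
diff tests:

	/*
	 * Hypothetical sketch: providing ->map_pages is currently the
	 * only way a driver is treated as "audited, doesn't need the
	 * mmap_lock" by vmf_can_call_fault().
	 */
	static const struct vm_operations_struct mydrv_vm_ops = {
		.fault		= mydrv_fault,
		.map_pages	= mydrv_map_pages,	/* opt in to VMA-lock faults */
	};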

There is very little performance change in the benchmarks we've run,
mostly because the vast majority of page faults are handled through the
other paths.  I still think this patch series is useful for workloads
that may take these paths more often, and just for cleaning up the
fault path in general (it's now clearer why we have to retry in these
cases).

Matthew Wilcox (Oracle) (6):
  mm: make lock_folio_maybe_drop_mmap() VMA lock aware
  mm: call wp_page_copy() under the VMA lock
  mm: handle shared faults under the VMA lock
  mm: handle COW faults under the VMA lock
  mm: handle read faults under the VMA lock
  mm: handle write faults to RO pages under the VMA lock


-- 
2.25.1
 
https://gitee.com/openeuler/kernel/issues/I8K7C7 
 
Link: https://gitee.com/openeuler/kernel/pulls/3059

 

Reviewed-by: Kefeng Wang <wangkefeng.wang@huawei.com>
Signed-off-by: Zheng Zengkai <zhengzengkai@huawei.com>
parents 357e8ab1 00214085
mm/filemap.c (+7 −6)
@@ -3104,7 +3104,7 @@ static int lock_folio_maybe_drop_mmap(struct vm_fault *vmf, struct folio *folio,

	/*
	 * NOTE! This will make us return with VM_FAULT_RETRY, but with
-	 * the mmap_lock still held. That's how FAULT_FLAG_RETRY_NOWAIT
+	 * the fault lock still held. That's how FAULT_FLAG_RETRY_NOWAIT
	 * is supposed to work. We have way too many special cases..
	 */
	if (vmf->flags & FAULT_FLAG_RETRY_NOWAIT)
@@ -3114,13 +3114,14 @@ static int lock_folio_maybe_drop_mmap(struct vm_fault *vmf, struct folio *folio,
	if (vmf->flags & FAULT_FLAG_KILLABLE) {
		if (__folio_lock_killable(folio)) {
			/*
-			 * We didn't have the right flags to drop the mmap_lock,
-			 * but all fault_handlers only check for fatal signals
-			 * if we return VM_FAULT_RETRY, so we need to drop the
-			 * mmap_lock here and return 0 if we don't have a fpin.
+			 * We didn't have the right flags to drop the
+			 * fault lock, but all fault_handlers only check
+			 * for fatal signals if we return VM_FAULT_RETRY,
+			 * so we need to drop the fault lock here and
+			 * return 0 if we don't have a fpin.
			 */
			if (*fpin == NULL)
-				mmap_read_unlock(vmf->vma->vm_mm);
+				release_fault_lock(vmf);
			return 0;
		}
	} else
mm/memory.c (+58 −35)
@@ -3044,6 +3044,36 @@ static inline void wp_page_reuse(struct vm_fault *vmf, struct folio *folio)
	count_vm_event(PGREUSE);
}

+/*
+ * We could add a bitflag somewhere, but for now, we know that all
+ * vm_ops that have a ->map_pages have been audited and don't need
+ * the mmap_lock to be held.
+ */
+static inline vm_fault_t vmf_can_call_fault(const struct vm_fault *vmf)
+{
+	struct vm_area_struct *vma = vmf->vma;
+
+	if (vma->vm_ops->map_pages || !(vmf->flags & FAULT_FLAG_VMA_LOCK))
+		return 0;
+	vma_end_read(vma);
+	return VM_FAULT_RETRY;
+}
+
+static vm_fault_t vmf_anon_prepare(struct vm_fault *vmf)
+{
+	struct vm_area_struct *vma = vmf->vma;
+
+	if (likely(vma->anon_vma))
+		return 0;
+	if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
+		vma_end_read(vma);
+		return VM_FAULT_RETRY;
+	}
+	if (__anon_vma_prepare(vma))
+		return VM_FAULT_OOM;
+	return 0;
+}
+
/*
 * Handle the case of a page which we actually need to copy to a new page,
 * either due to COW or unsharing.
@@ -3071,27 +3101,29 @@ static vm_fault_t wp_page_copy(struct vm_fault *vmf)
	pte_t entry;
	int page_copied = 0;
	struct mmu_notifier_range range;
-	int ret;
+	vm_fault_t ret;

	delayacct_wpcopy_start();

	if (vmf->page)
		old_folio = page_folio(vmf->page);
-	if (unlikely(anon_vma_prepare(vma)))
-		goto oom;
+	ret = vmf_anon_prepare(vmf);
+	if (unlikely(ret))
+		goto out;

	if (is_zero_pfn(pte_pfn(vmf->orig_pte))) {
		new_folio = vma_alloc_zeroed_movable_folio(vma, vmf->address);
		if (!new_folio)
			goto oom;
	} else {
+		int err;
		new_folio = vma_alloc_folio(GFP_HIGHUSER_MOVABLE, 0, vma,
				vmf->address, false);
		if (!new_folio)
			goto oom;

-		ret = __wp_page_copy_user(&new_folio->page, vmf->page, vmf);
-		if (ret) {
+		err = __wp_page_copy_user(&new_folio->page, vmf->page, vmf);
+		if (err) {
			/*
			 * COW failed, if the fault was solved by other,
			 * it's fine. If not, userspace would re-fault on
@@ -3104,7 +3136,7 @@ static vm_fault_t wp_page_copy(struct vm_fault *vmf)
				folio_put(old_folio);

			delayacct_wpcopy_end();
-			return ret == -EHWPOISON ? VM_FAULT_HWPOISON : 0;
+			return err == -EHWPOISON ? VM_FAULT_HWPOISON : 0;
		}
		kmsan_copy_page_meta(&new_folio->page, vmf->page);
	}
@@ -3214,11 +3246,13 @@ static vm_fault_t wp_page_copy(struct vm_fault *vmf)
oom_free_new:
	folio_put(new_folio);
oom:
+	ret = VM_FAULT_OOM;
+out:
	if (old_folio)
		folio_put(old_folio);

	delayacct_wpcopy_end();
-	return VM_FAULT_OOM;
+	return ret;
}

/**
@@ -3270,10 +3304,9 @@ static vm_fault_t wp_pfn_shared(struct vm_fault *vmf)
		vm_fault_t ret;

		pte_unmap_unlock(vmf->pte, vmf->ptl);
-		if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
-			vma_end_read(vmf->vma);
-			return VM_FAULT_RETRY;
-		}
+		ret = vmf_can_call_fault(vmf);
+		if (ret)
+			return ret;

		vmf->flags |= FAULT_FLAG_MKWRITE;
		ret = vma->vm_ops->pfn_mkwrite(vmf);
@@ -3297,10 +3330,10 @@ static vm_fault_t wp_page_shared(struct vm_fault *vmf, struct folio *folio)
		vm_fault_t tmp;

		pte_unmap_unlock(vmf->pte, vmf->ptl);
-		if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
+		tmp = vmf_can_call_fault(vmf);
+		if (tmp) {
			folio_put(folio);
-			vma_end_read(vmf->vma);
-			return VM_FAULT_RETRY;
+			return tmp;
		}

		tmp = do_page_mkwrite(vmf, folio);
@@ -3444,12 +3477,6 @@ static vm_fault_t do_wp_page(struct vm_fault *vmf)
		return 0;
	}
copy:
-	if ((vmf->flags & FAULT_FLAG_VMA_LOCK) && !vma->anon_vma) {
-		pte_unmap_unlock(vmf->pte, vmf->ptl);
-		vma_end_read(vmf->vma);
-		return VM_FAULT_RETRY;
-	}
-
	/*
	 * Ok, we need to copy. Oh, well..
	 */
@@ -4575,10 +4602,9 @@ static vm_fault_t do_read_fault(struct vm_fault *vmf)
			return ret;
	}

-	if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
-		vma_end_read(vmf->vma);
-		return VM_FAULT_RETRY;
-	}
+	ret = vmf_can_call_fault(vmf);
+	if (ret)
+		return ret;

	ret = __do_fault(vmf);
	if (unlikely(ret & (VM_FAULT_ERROR | VM_FAULT_NOPAGE | VM_FAULT_RETRY)))
@@ -4597,13 +4623,11 @@ static vm_fault_t do_cow_fault(struct vm_fault *vmf)
	struct vm_area_struct *vma = vmf->vma;
	vm_fault_t ret;

-	if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
-		vma_end_read(vma);
-		return VM_FAULT_RETRY;
-	}
-
-	if (unlikely(anon_vma_prepare(vma)))
-		return VM_FAULT_OOM;
+	ret = vmf_can_call_fault(vmf);
+	if (!ret)
+		ret = vmf_anon_prepare(vmf);
+	if (ret)
+		return ret;

	vmf->cow_page = alloc_page_vma(GFP_HIGHUSER_MOVABLE, vma, vmf->address);
	if (!vmf->cow_page)
@@ -4642,10 +4666,9 @@ static vm_fault_t do_shared_fault(struct vm_fault *vmf)
	vm_fault_t ret, tmp;
	struct folio *folio;

-	if (vmf->flags & FAULT_FLAG_VMA_LOCK) {
-		vma_end_read(vma);
-		return VM_FAULT_RETRY;
-	}
+	ret = vmf_can_call_fault(vmf);
+	if (ret)
+		return ret;

	ret = __do_fault(vmf);
	if (unlikely(ret & (VM_FAULT_ERROR | VM_FAULT_NOPAGE | VM_FAULT_RETRY)))