linux_dsm_epyc7002/arch/sparc/mm/gup.c

/*
 * Lockless get_user_pages_fast for sparc, cribbed from powerpc
 *
 * Copyright (C) 2008 Nick Piggin
 * Copyright (C) 2008 Novell Inc.
 */

#include <linux/sched.h>
#include <linux/mm.h>
#include <linux/vmstat.h>
#include <linux/pagemap.h>
#include <linux/rwsem.h>
#include <asm/pgtable.h>

/*
 * The performance critical leaf functions are made noinline otherwise gcc
 * inlines everything into a single function which results in too much
 * register pressure.
 *
 * gup_pte_range - lockless walk of the PTEs covering [addr, end).
 * @pmd:   snapshot of the PMD entry whose PTE table is walked
 * @addr:  first user address to process
 * @end:   address at which the walk stops (exclusive)
 * @write: non-zero if the caller needs the pages to be writable
 * @pages: output array; slot *nr receives each page that was pinned
 * @nr:    in/out count of entries already stored in @pages
 *
 * Returns 1 when every PTE in the range was pinned, 0 as soon as one PTE
 * cannot be handled here.  On a 0 return, the pages recorded so far stay
 * in @pages and remain counted in *nr.
 */
static noinline int gup_pte_range(pmd_t pmd, unsigned long addr,
		unsigned long end, int write, struct page **pages, int *nr)
{
	unsigned long mask, result;
	pte_t *ptep;

	/*
	 * Pick the required PTE bits for the active MMU layout: the 4V
	 * definitions when tlb_type is hypervisor, the 4U ones otherwise.
	 * The write bit is only required when the caller asked for write
	 * access.
	 */
	if (tlb_type == hypervisor) {
		result = _PAGE_PRESENT_4V|_PAGE_P_4V;
		if (write)
			result |= _PAGE_WRITE_4V;
	} else {
		result = _PAGE_PRESENT_4U|_PAGE_P_4U;
		if (write)
			result |= _PAGE_WRITE_4U;
	}
	/*
	 * _PAGE_SPECIAL is part of the mask but not of the expected value,
	 * so a PTE with the special bit set fails the comparison below.
	 */
	mask = result | _PAGE_SPECIAL;

	ptep = pte_offset_kernel(&pmd, addr);
	do {
		struct page *page, *head;
		/* Work on a local snapshot; *ptep is re-read further down. */
		pte_t pte = *ptep;

		if ((pte_val(pte) & mask) != result)
			return 0;
		VM_BUG_ON(!pfn_valid(pte_pfn(pte)));

		/* The hugepage case is simplified on sparc64 because
		 * we encode the sub-page pfn offsets into the
		 * hugepage PTEs.  We could optimize this in the future
		 * by using page_cache_add_speculative() for the hugepage
		 * case.
		 */
		page = pte_page(pte);
		head = compound_head(page);
		/* The reference is taken on the compound head, not on @page. */
		if (!page_cache_get_speculative(head))
			return 0;
		/*
		 * If the PTE no longer matches the snapshot, drop the
		 * reference just taken and give up on this range.
		 */
		if (unlikely(pte_val(pte) != pte_val(*ptep))) {
			put_page(head);
			return 0;
		}

		pages[*nr] = page;
		(*nr)++;
	} while (ptep++, addr += PAGE_SIZE, addr != end);

	return 1;
}

/*
 * gup_huge_pmd - pin the sub-pages of a huge PMD that cover [addr, end).
 * @pmdp:  pointer to the live PMD entry, used to re-validate @pmd
 * @pmd:   snapshot of *@pmdp taken by the caller
 * @addr:  first user address to process
 * @end:   address at which processing stops (exclusive)
 * @write: non-zero if the caller needs the pages to be writable
 * @pages: output array; sub-pages are stored starting at slot *nr
 * @nr:    in/out count of entries already stored in @pages
 *
 * Returns 1 on success.  Returns 0 when the PMD lacks _PAGE_VALID, when
 * write access is requested but pmd_write() is false, when the references
 * cannot be taken, or when the PMD changed underneath us; in the last two
 * cases *nr is rolled back to its value on entry.
 */
static int gup_huge_pmd(pmd_t *pmdp, pmd_t pmd, unsigned long addr,
			unsigned long end, int write, struct page **pages,
			int *nr)
{
	struct page *head, *page;
	int refs;

	if (!(pmd_val(pmd) & _PAGE_VALID))
		return 0;

	if (write && !pmd_write(pmd))
		return 0;

	refs = 0;
	/* First sub-page: offset of @addr within the PMD, in pages. */
	page = pmd_page(pmd) + ((addr & ~PMD_MASK) >> PAGE_SHIFT);
	head = compound_head(page);
	/*
	 * Record every sub-page first and only count how many references
	 * are needed; they are taken in one batch after the loop.
	 */
	do {
		VM_BUG_ON(compound_head(page) != head);
		pages[*nr] = page;
		(*nr)++;
		page++;
		refs++;
	} while (addr += PAGE_SIZE, addr != end);

	/* Take all @refs references on the head at once; undo *nr on failure. */
	if (!page_cache_add_speculative(head, refs)) {
		*nr -= refs;
		return 0;
	}

	/*
	 * The PMD changed since the snapshot: undo the bookkeeping and drop
	 * the references one at a time.
	 */
	if (unlikely(pmd_val(pmd) != pmd_val(*pmdp))) {
		*nr -= refs;
		while (refs--)
			put_page(head);
		return 0;
	}

	return 1;
}

/*
 * Walk the PMD entries that cover [addr, end) below @pud.  Huge PMDs are
 * handed to gup_huge_pmd(), everything else to gup_pte_range().  Returns 1
 * if the whole range was pinned, 0 on an empty PMD or on the first failure
 * reported by a helper.
 */
static int gup_pmd_range(pud_t pud, unsigned long addr, unsigned long end,
		int write, struct page **pages, int *nr)
{
	pmd_t *entry = pmd_offset(&pud, addr);
	unsigned long boundary;

	for (;;) {
		/* Local snapshot of the entry; helpers work on this copy. */
		pmd_t val = *entry;
		int pinned;

		boundary = pmd_addr_end(addr, end);
		if (pmd_none(val))
			return 0;

		if (unlikely(pmd_large(val)))
			pinned = gup_huge_pmd(entry, val, addr, boundary,
					      write, pages, nr);
		else
			pinned = gup_pte_range(val, addr, boundary, write,
					       pages, nr);
		if (!pinned)
			return 0;

		entry++;
		addr = boundary;
		if (addr == end)
			break;
	}

	return 1;
}

/*
 * Walk the PUD entries that cover [addr, end) below @pgd and descend into
 * gup_pmd_range() for each one.  Returns 1 if the whole range was pinned,
 * 0 on an empty PUD or when the PMD-level walk fails.
 */
static int gup_pud_range(pgd_t pgd, unsigned long addr, unsigned long end,
		int write, struct page **pages, int *nr)
{
	pud_t *entry = pud_offset(&pgd, addr);
	unsigned long boundary;

	for (;;) {
		/* Local snapshot of the entry passed down to the PMD walk. */
		pud_t val = *entry;

		boundary = pud_addr_end(addr, end);
		if (pud_none(val))
			return 0;
		if (!gup_pmd_range(val, addr, boundary, write, pages, nr))
			return 0;

		entry++;
		addr = boundary;
		if (addr == end)
			break;
	}

	return 1;
}

/*
 * __get_user_pages_fast - lockless pin of user pages, fast path only.
 * @start:    starting user address (rounded down to a page boundary)
 * @nr_pages: number of pages to pin
 * @write:    non-zero if the pages must be writable
 * @pages:    output array receiving the pinned pages
 *
 * Walks the current mm's page tables with interrupts disabled, saving and
 * restoring the caller's interrupt state.  There is no fallback to the slow
 * path: the walk simply stops at the first entry it cannot handle.
 *
 * Returns the number of pages pinned, which may be fewer than @nr_pages
 * (including zero).
 */
int __get_user_pages_fast(unsigned long start, int nr_pages, int write,
			  struct page **pages)
{
	struct mm_struct *mm = current->mm;
	unsigned long addr, len, end;
	unsigned long next, flags;
	pgd_t *pgdp;
	int nr = 0;

	/*
	 * The do/while walkers below always process at least one page, so an
	 * empty (or negative) request must be rejected up front; otherwise
	 * end == start and a page could be pinned and stored in pages[0]
	 * although the caller asked for nothing.
	 */
	if (nr_pages <= 0)
		return 0;

	start &= PAGE_MASK;
	addr = start;
	len = (unsigned long) nr_pages << PAGE_SHIFT;
	end = start + len;

	local_irq_save(flags);
	pgdp = pgd_offset(mm, addr);
	do {
		pgd_t pgd = *pgdp;

		next = pgd_addr_end(addr, end);
		if (pgd_none(pgd))
			break;
		if (!gup_pud_range(pgd, addr, next, write, pages, &nr))
			break;
	} while (pgdp++, addr = next, addr != end);
	local_irq_restore(flags);

	return nr;
}

/*
 * get_user_pages_fast - pin user pages, trying the lockless walk first.
 * @start:    starting user address (rounded down to a page boundary)
 * @nr_pages: number of pages to pin
 * @write:    non-zero if the pages must be writable
 * @pages:    output array receiving the pinned pages
 *
 * Walks the current mm's page tables with interrupts disabled.  If the walk
 * hits an entry it cannot handle, the remaining pages are requested through
 * get_user_pages_unlocked().
 *
 * Returns the total number of pages pinned.  If nothing was pinned by the
 * fast path, the return value of get_user_pages_unlocked() is passed through
 * unchanged, which may be a negative error code.  Returns 0 when
 * @nr_pages <= 0.
 */
int get_user_pages_fast(unsigned long start, int nr_pages, int write,
			struct page **pages)
{
	struct mm_struct *mm = current->mm;
	unsigned long addr, len, end;
	unsigned long next;
	pgd_t *pgdp;
	int nr = 0;
	int ret;

	/*
	 * The do/while walkers below always process at least one page, so an
	 * empty (or negative) request must be rejected up front; otherwise
	 * end == start and a page could be pinned and stored in pages[0]
	 * although the caller asked for nothing.
	 */
	if (nr_pages <= 0)
		return 0;

	start &= PAGE_MASK;
	addr = start;
	len = (unsigned long) nr_pages << PAGE_SHIFT;
	end = start + len;

	/*
	 * XXX: batch / limit 'nr', to avoid large irq off latency
	 * needs some instrumenting to determine the common sizes used by
	 * important workloads (eg. DB2), and whether limiting the batch size
	 * will decrease performance.
	 *
	 * It seems like we're in the clear for the moment. Direct-IO is
	 * the main guy that batches up lots of get_user_pages, and even
	 * they are limited to 64-at-a-time which is not so many.
	 */
	/*
	 * This doesn't prevent pagetable teardown, but does prevent
	 * the pagetables from being freed on sparc.
	 *
	 * So long as we atomically load page table pointers versus teardown,
	 * we can follow the address down to the page and take a ref on it.
	 */
	local_irq_disable();

	pgdp = pgd_offset(mm, addr);
	do {
		pgd_t pgd = *pgdp;

		next = pgd_addr_end(addr, end);
		if (pgd_none(pgd))
			goto slow;
		if (!gup_pud_range(pgd, addr, next, write, pages, &nr))
			goto slow;
	} while (pgdp++, addr = next, addr != end);

	local_irq_enable();

	VM_BUG_ON(nr != (end - start) >> PAGE_SHIFT);
	return nr;

slow:
	local_irq_enable();

	/*
	 * Try to get the remaining pages with get_user_pages.  Widen nr
	 * before shifting: shifting the plain int could overflow for very
	 * large requests (the len computation above already widens).
	 */
	start += (unsigned long) nr << PAGE_SHIFT;
	pages += nr;

	ret = get_user_pages_unlocked(start,
		(end - start) >> PAGE_SHIFT, pages,
		write ? FOLL_WRITE : 0);

	/*
	 * Have to be a bit careful with return values: once the fast path
	 * has pinned something, a slow-path error must not hide those pages
	 * from the caller.
	 */
	if (nr > 0) {
		if (ret < 0)
			ret = nr;
		else
			ret += nr;
	}

	return ret;
}
sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00			`/*`
			`* Lockless get_user_pages_fast for sparc, cribbed from powerpc`
			`*`
			`* Copyright (C) 2008 Nick Piggin`
			`* Copyright (C) 2008 Novell Inc.`
			`*/`

			`#include <linux/sched.h>`
			`#include <linux/mm.h>`
			`#include <linux/vmstat.h>`
			`#include <linux/pagemap.h>`
			`#include <linux/rwsem.h>`
			`#include <asm/pgtable.h>`

			`/*`
			`* The performance critical leaf functions are made noinline otherwise gcc`
			`* inlines everything into a single function which results in too much`
			`* register pressure.`
			`*/`
			`static noinline int gup_pte_range(pmd_t pmd, unsigned long addr,`
			`unsigned long end, int write, struct page **pages, int *nr)`
			`{`
			`unsigned long mask, result;`
			`pte_t *ptep;`

			`if (tlb_type == hypervisor) {`
			`result = _PAGE_PRESENT_4V\|_PAGE_P_4V;`
			`if (write)`
			`result \|= _PAGE_WRITE_4V;`
			`} else {`
			`result = _PAGE_PRESENT_4U\|_PAGE_P_4U;`
			`if (write)`
			`result \|= _PAGE_WRITE_4U;`
			`}`
			`mask = result \| _PAGE_SPECIAL;`

			`ptep = pte_offset_kernel(&pmd, addr);`
			`do {`
			`struct page *page, *head;`
			`pte_t pte = *ptep;`

			`if ((pte_val(pte) & mask) != result)`
			`return 0;`
			`VM_BUG_ON(!pfn_valid(pte_pfn(pte)));`

			`/* The hugepage case is simplified on sparc64 because`
			`* we encode the sub-page pfn offsets into the`
			`* hugepage PTEs. We could optimize this in the future`
			`* use page_cache_add_speculative() for the hugepage case.`
			`*/`
			`page = pte_page(pte);`
			`head = compound_head(page);`
			`if (!page_cache_get_speculative(head))`
			`return 0;`
			`if (unlikely(pte_val(pte) != pte_val(*ptep))) {`
			`put_page(head);`
			`return 0;`
			`}`

			`pages[*nr] = page;`
			`(*nr)++;`
			`} while (ptep++, addr += PAGE_SIZE, addr != end);`

			`return 1;`
			`}`

sparc64: Fix get_user_pages_fast() wrt. THP. Mostly mirrors the s390 logic, as unlike x86 we don't need the SetPageReferenced() bits. On sparc64 we also lack a user/privileged bit in the huge PMDs. In order to make this work for THP and non-THP builds, some header file adjustments were necessary. Namely, provide the PMD_HUGE_* bit defines and the pmd_large() inline unconditionally rather than protected by TRANSPARENT_HUGEPAGE. Reported-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Signed-off-by: David S. Miller <davem@davemloft.net> 2013-02-14 03:21:06 +07:00			`static int gup_huge_pmd(pmd_t *pmdp, pmd_t pmd, unsigned long addr,`
			`unsigned long end, int write, struct page **pages,`
			`int *nr)`
			`{`
mm: drop tail page refcounting Tail page refcounting is utterly complicated and painful to support. It uses ->_mapcount on tail pages to store how many times this page is pinned. get_page() bumps ->_mapcount on tail page in addition to ->_count on head. This information is required by split_huge_page() to be able to distribute pins from head of compound page to tails during the split. We will need ->_mapcount to account PTE mappings of subpages of the compound page. We eliminate need in current meaning of ->_mapcount in tail pages by forbidding split entirely if the page is pinned. The only user of tail page refcounting is THP which is marked BROKEN for now. Let's drop all this mess. It makes get_page() and put_page() much simpler. Signed-off-by: Kirill A. Shutemov <kirill.shutemov@linux.intel.com> Tested-by: Sasha Levin <sasha.levin@oracle.com> Tested-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Acked-by: Vlastimil Babka <vbabka@suse.cz> Acked-by: Jerome Marchand <jmarchan@redhat.com> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Hugh Dickins <hughd@google.com> Cc: Dave Hansen <dave.hansen@intel.com> Cc: Mel Gorman <mgorman@suse.de> Cc: Rik van Riel <riel@redhat.com> Cc: Naoya Horiguchi <n-horiguchi@ah.jp.nec.com> Cc: Steve Capper <steve.capper@linaro.org> Cc: Johannes Weiner <hannes@cmpxchg.org> Cc: Michal Hocko <mhocko@suse.cz> Cc: Christoph Lameter <cl@linux.com> Cc: David Rientjes <rientjes@google.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2016-01-16 07:52:56 +07:00			`struct page head, page;`
sparc64: Fix get_user_pages_fast() wrt. THP. Mostly mirrors the s390 logic, as unlike x86 we don't need the SetPageReferenced() bits. On sparc64 we also lack a user/privileged bit in the huge PMDs. In order to make this work for THP and non-THP builds, some header file adjustments were necessary. Namely, provide the PMD_HUGE_* bit defines and the pmd_large() inline unconditionally rather than protected by TRANSPARENT_HUGEPAGE. Reported-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Signed-off-by: David S. Miller <davem@davemloft.net> 2013-02-14 03:21:06 +07:00			`int refs;`

sparc64: Fix bugs in get_user_pages_fast() wrt. THP. The large PMD path needs to check _PAGE_VALID not _PAGE_PRESENT, to decide if it needs to bail and return 0. pmd_large() should therefore just check _PAGE_PMD_HUGE. Calls to gup_huge_pmd() are guarded with a check of pmd_large(), so we just need to add a valid bit check. Signed-off-by: David S. Miller <davem@davemloft.net> 2014-04-26 00:21:12 +07:00			`if (!(pmd_val(pmd) & _PAGE_VALID))`
sparc64: Encode huge PMDs using PTE encoding. Now that we have 64-bits for PMDs we can stop using special encodings for the huge PMD values, and just put real PTEs in there. We allocate a _PAGE_PMD_HUGE bit to distinguish between plain PMDs and huge ones. It is the same for both 4U and 4V PTE layouts. We also use _PAGE_SPECIAL to indicate the splitting state, since a huge PMD cannot also be special. All of the PMD --> PTE translation code disappears, and most of the huge PMD bit modifications and tests just degenerate into the PTE operations. In particular USER_PGTABLE_CHECK_PMD_HUGE becomes trivial. As a side effect, normal PMDs don't shift the physical address around. This also speeds up the page table walks in the TLB miss paths since they don't have to do the shifts any more. Another non-trivial aspect is that pte_modify() has to be changed to preserve the _PAGE_PMD_HUGE bits as well as the page size field of the pte. Signed-off-by: David S. Miller <davem@davemloft.net> 2013-09-27 03:45:15 +07:00			`return 0;`

			`if (write && !pmd_write(pmd))`
sparc64: Fix get_user_pages_fast() wrt. THP. Mostly mirrors the s390 logic, as unlike x86 we don't need the SetPageReferenced() bits. On sparc64 we also lack a user/privileged bit in the huge PMDs. In order to make this work for THP and non-THP builds, some header file adjustments were necessary. Namely, provide the PMD_HUGE_* bit defines and the pmd_large() inline unconditionally rather than protected by TRANSPARENT_HUGEPAGE. Reported-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Signed-off-by: David S. Miller <davem@davemloft.net> 2013-02-14 03:21:06 +07:00			`return 0;`

			`refs = 0;`
sparc64: Fix gup_huge_pmd The function assumes that each PMD points to head of a huge page. This is not correct as a PMD can point to start of any 8M region with a, say 256M, hugepage. The fix ensures that it points to the correct head of any PMD huge page. Cc: Julian Calaby <julian.calaby@gmail.com> Signed-off-by: Nitin Gupta <nitin.m.gupta@oracle.com> Signed-off-by: David S. Miller <davem@davemloft.net> 2017-06-23 07:15:08 +07:00			`page = pmd_page(pmd) + ((addr & ~PMD_MASK) >> PAGE_SHIFT);`
			`head = compound_head(page);`
sparc64: Fix get_user_pages_fast() wrt. THP. Mostly mirrors the s390 logic, as unlike x86 we don't need the SetPageReferenced() bits. On sparc64 we also lack a user/privileged bit in the huge PMDs. In order to make this work for THP and non-THP builds, some header file adjustments were necessary. Namely, provide the PMD_HUGE_* bit defines and the pmd_large() inline unconditionally rather than protected by TRANSPARENT_HUGEPAGE. Reported-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Signed-off-by: David S. Miller <davem@davemloft.net> 2013-02-14 03:21:06 +07:00			`do {`
			`VM_BUG_ON(compound_head(page) != head);`
			`pages[*nr] = page;`
			`(*nr)++;`
			`page++;`
			`refs++;`
			`} while (addr += PAGE_SIZE, addr != end);`

			`if (!page_cache_add_speculative(head, refs)) {`
			`*nr -= refs;`
			`return 0;`
			`}`

			`if (unlikely(pmd_val(pmd) != pmd_val(*pmdp))) {`
			`*nr -= refs;`
			`while (refs--)`
			`put_page(head);`
			`return 0;`
			`}`

			`return 1;`
			`}`

sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00			`static int gup_pmd_range(pud_t pud, unsigned long addr, unsigned long end,`
			`int write, struct page **pages, int *nr)`
			`{`
			`unsigned long next;`
			`pmd_t *pmdp;`

			`pmdp = pmd_offset(&pud, addr);`
			`do {`
			`pmd_t pmd = *pmdp;`

			`next = pmd_addr_end(addr, end);`
sparc, thp: remove infrastructure for handling splitting PMDs With new refcounting we don't need to mark PMDs splitting. Let's drop code to handle this. Signed-off-by: Kirill A. Shutemov <kirill.shutemov@linux.intel.com> Cc: Sasha Levin <sasha.levin@oracle.com> Cc: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Cc: Jerome Marchand <jmarchan@redhat.com> Cc: Vlastimil Babka <vbabka@suse.cz> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Hugh Dickins <hughd@google.com> Cc: Dave Hansen <dave.hansen@intel.com> Cc: Mel Gorman <mgorman@suse.de> Cc: Rik van Riel <riel@redhat.com> Cc: Naoya Horiguchi <n-horiguchi@ah.jp.nec.com> Cc: Steve Capper <steve.capper@linaro.org> Cc: Johannes Weiner <hannes@cmpxchg.org> Cc: Michal Hocko <mhocko@suse.cz> Cc: Christoph Lameter <cl@linux.com> Cc: David Rientjes <rientjes@google.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2016-01-16 07:53:28 +07:00			`if (pmd_none(pmd))`
sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00			`return 0;`
sparc64: Fix get_user_pages_fast() wrt. THP. Mostly mirrors the s390 logic, as unlike x86 we don't need the SetPageReferenced() bits. On sparc64 we also lack a user/privileged bit in the huge PMDs. In order to make this work for THP and non-THP builds, some header file adjustments were necessary. Namely, provide the PMD_HUGE_* bit defines and the pmd_large() inline unconditionally rather than protected by TRANSPARENT_HUGEPAGE. Reported-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> Signed-off-by: David S. Miller <davem@davemloft.net> 2013-02-14 03:21:06 +07:00			`if (unlikely(pmd_large(pmd))) {`
			`if (!gup_huge_pmd(pmdp, pmd, addr, next,`
			`write, pages, nr))`
			`return 0;`
			`} else if (!gup_pte_range(pmd, addr, next, write,`
			`pages, nr))`
sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00			`return 0;`
			`} while (pmdp++, addr = next, addr != end);`

			`return 1;`
			`}`

			`static int gup_pud_range(pgd_t pgd, unsigned long addr, unsigned long end,`
			`int write, struct page **pages, int *nr)`
			`{`
			`unsigned long next;`
			`pud_t *pudp;`

			`pudp = pud_offset(&pgd, addr);`
			`do {`
			`pud_t pud = *pudp;`

			`next = pud_addr_end(addr, end);`
			`if (pud_none(pud))`
			`return 0;`
sparc64: Revert 16GB huge page support. It overflows the amount of space available in the initial .text section of trap handler assembler in some configurations, resulting in build failures. Signed-off-by: David S. Miller <davem@davemloft.net> 2017-08-10 23:49:15 +07:00			`if (!gup_pmd_range(pud, addr, next, write, pages, nr))`
sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00			`return 0;`
			`} while (pudp++, addr = next, addr != end);`

			`return 1;`
			`}`

sparc64: Implement __get_user_pages_fast(). It is not sufficient to only implement get_user_pages_fast(), you must also implement the atomic version __get_user_pages_fast() otherwise you end up using the weak symbol fallback implementation which simply returns zero. This is dangerous, because it causes the futex code to loop forever if transparent hugepages are supported (see get_futex_key()). Signed-off-by: David S. Miller <davem@davemloft.net> 2014-10-24 23:59:02 +07:00			`int __get_user_pages_fast(unsigned long start, int nr_pages, int write,`
			`struct page **pages)`
			`{`
			`struct mm_struct *mm = current->mm;`
			`unsigned long addr, len, end;`
			`unsigned long next, flags;`
			`pgd_t *pgdp;`
			`int nr = 0;`

			`start &= PAGE_MASK;`
			`addr = start;`
			`len = (unsigned long) nr_pages << PAGE_SHIFT;`
			`end = start + len;`

			`local_irq_save(flags);`
			`pgdp = pgd_offset(mm, addr);`
			`do {`
			`pgd_t pgd = *pgdp;`

			`next = pgd_addr_end(addr, end);`
			`if (pgd_none(pgd))`
			`break;`
			`if (!gup_pud_range(pgd, addr, next, write, pages, &nr))`
			`break;`
			`} while (pgdp++, addr = next, addr != end);`
			`local_irq_restore(flags);`

			`return nr;`
			`}`

sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00			`int get_user_pages_fast(unsigned long start, int nr_pages, int write,`
			`struct page **pages)`
			`{`
			`struct mm_struct *mm = current->mm;`
			`unsigned long addr, len, end;`
			`unsigned long next;`
			`pgd_t *pgdp;`
			`int nr = 0;`

			`start &= PAGE_MASK;`
			`addr = start;`
			`len = (unsigned long) nr_pages << PAGE_SHIFT;`
			`end = start + len;`

			`/*`
			`* XXX: batch / limit 'nr', to avoid large irq off latency`
			`* needs some instrumenting to determine the common sizes used by`
			`* important workloads (eg. DB2), and whether limiting the batch size`
			`* will decrease performance.`
			`*`
			`* It seems like we're in the clear for the moment. Direct-IO is`
			`* the main guy that batches up lots of get_user_pages, and even`
			`* they are limited to 64-at-a-time which is not so many.`
			`*/`
			`/*`
			`* This doesn't prevent pagetable teardown, but does prevent`
			`* the pagetables from being freed on sparc.`
			`*`
			`* So long as we atomically load page table pointers versus teardown,`
			`* we can follow the address down to the page and take a ref on it.`
			`*/`
			`local_irq_disable();`

			`pgdp = pgd_offset(mm, addr);`
			`do {`
			`pgd_t pgd = *pgdp;`

			`next = pgd_addr_end(addr, end);`
			`if (pgd_none(pgd))`
			`goto slow;`
			`if (!gup_pud_range(pgd, addr, next, write, pages, &nr))`
			`goto slow;`
			`} while (pgdp++, addr = next, addr != end);`

			`local_irq_enable();`

			`VM_BUG_ON(nr != (end - start) >> PAGE_SHIFT);`
			`return nr;`

			`{`
			`int ret;`

			`slow:`
			`local_irq_enable();`

			`/* Try to get the remaining pages with get_user_pages */`
			`start += nr << PAGE_SHIFT;`
			`pages += nr;`

mm/gup: Switch all callers of get_user_pages() to not pass tsk/mm We will soon modify the vanilla get_user_pages() so it can no longer be used on mm/tasks other than 'current/current->mm', which is by far the most common way it is called. For now, we allow the old-style calls, but warn when they are used. (implemented in previous patch) This patch switches all callers of: get_user_pages() get_user_pages_unlocked() get_user_pages_locked() to stop passing tsk/mm so they will no longer see the warnings. Signed-off-by: Dave Hansen <dave.hansen@linux.intel.com> Reviewed-by: Thomas Gleixner <tglx@linutronix.de> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Andrew Morton <akpm@linux-foundation.org> Cc: Andy Lutomirski <luto@amacapital.net> Cc: Borislav Petkov <bp@alien8.de> Cc: Brian Gerst <brgerst@gmail.com> Cc: Dave Hansen <dave@sr71.net> Cc: Denys Vlasenko <dvlasenk@redhat.com> Cc: H. Peter Anvin <hpa@zytor.com> Cc: Kirill A. Shutemov <kirill.shutemov@linux.intel.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Naoya Horiguchi <n-horiguchi@ah.jp.nec.com> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Rik van Riel <riel@redhat.com> Cc: Srikar Dronamraju <srikar@linux.vnet.ibm.com> Cc: Vlastimil Babka <vbabka@suse.cz> Cc: jack@suse.cz Cc: linux-mm@kvack.org Link: http://lkml.kernel.org/r/20160212210156.113E9407@viggo.jf.intel.com Signed-off-by: Ingo Molnar <mingo@kernel.org> 2016-02-13 04:01:56 +07:00			`ret = get_user_pages_unlocked(start,`
mm: replace get_user_pages_unlocked() write/force parameters with gup_flags This removes the 'write' and 'force' use from get_user_pages_unlocked() and replaces them with 'gup_flags' to make the use of FOLL_FORCE explicit in callers as use of this flag can result in surprising behaviour (and hence bugs) within the mm subsystem. Signed-off-by: Lorenzo Stoakes <lstoakes@gmail.com> Reviewed-by: Jan Kara <jack@suse.cz> Acked-by: Michal Hocko <mhocko@suse.com> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2016-10-13 07:20:13 +07:00			`(end - start) >> PAGE_SHIFT, pages,`
			`write ? FOLL_WRITE : 0);`
sparc64: implement get_user_pages_fast() Signed-off-by: David S. Miller <davem@davemloft.net> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2011-07-26 07:12:22 +07:00
			`/* Have to be a bit careful with return values */`
			`if (nr > 0) {`
			`if (ret < 0)`
			`ret = nr;`
			`else`
			`ret += nr;`
			`}`

			`return ret;`
			`}`
			`}`