mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 4d66bcc7cf
			
		
	
	
		4d66bcc7cf
		
	
	
	
	
		
			
			We would want to use number of page table level to define mm_struct. Let's expose it as CONFIG_PGTABLE_LEVELS. We need to define PGTABLE_LEVELS before sourcing init/Kconfig: arch/Kconfig will define default value and it's sourced from init/Kconfig. Signed-off-by: Kirill A. Shutemov <kirill.shutemov@linux.intel.com> Cc: Tony Luck <tony.luck@intel.com> Cc: Fenghua Yu <fenghua.yu@intel.com> Tested-by: Guenter Roeck <linux@roeck-us.net> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
		
			
				
	
	
		
			595 lines
		
	
	
		
			21 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			595 lines
		
	
	
		
			21 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| #ifndef _ASM_IA64_PGTABLE_H
 | |
| #define _ASM_IA64_PGTABLE_H
 | |
| 
 | |
| /*
 | |
|  * This file contains the functions and defines necessary to modify and use
 | |
|  * the IA-64 page table tree.
 | |
|  *
 | |
|  * This hopefully works with any (fixed) IA-64 page-size, as defined
 | |
|  * in <asm/page.h>.
 | |
|  *
 | |
|  * Copyright (C) 1998-2005 Hewlett-Packard Co
 | |
|  *	David Mosberger-Tang <davidm@hpl.hp.com>
 | |
|  */
 | |
| 
 | |
| 
 | |
| #include <asm/mman.h>
 | |
| #include <asm/page.h>
 | |
| #include <asm/processor.h>
 | |
| #include <asm/types.h>
 | |
| 
 | |
| #define IA64_MAX_PHYS_BITS	50	/* max. number of physical address bits (architected) */
 | |
| 
 | |
| /*
 | |
|  * First, define the various bits in a PTE.  Note that the PTE format
 | |
|  * matches the VHPT short format, the first doubleword of the VHPT long
 | |
|  * format, and the first doubleword of the TLB insertion format.
 | |
|  */
 | |
| #define _PAGE_P_BIT		0
 | |
| #define _PAGE_A_BIT		5
 | |
| #define _PAGE_D_BIT		6
 | |
| 
 | |
| #define _PAGE_P			(1 << _PAGE_P_BIT)	/* page present bit */
 | |
| #define _PAGE_MA_WB		(0x0 <<  2)	/* write back memory attribute */
 | |
| #define _PAGE_MA_UC		(0x4 <<  2)	/* uncacheable memory attribute */
 | |
| #define _PAGE_MA_UCE		(0x5 <<  2)	/* UC exported attribute */
 | |
| #define _PAGE_MA_WC		(0x6 <<  2)	/* write coalescing memory attribute */
 | |
| #define _PAGE_MA_NAT		(0x7 <<  2)	/* not-a-thing attribute */
 | |
| #define _PAGE_MA_MASK		(0x7 <<  2)
 | |
| #define _PAGE_PL_0		(0 <<  7)	/* privilege level 0 (kernel) */
 | |
| #define _PAGE_PL_1		(1 <<  7)	/* privilege level 1 (unused) */
 | |
| #define _PAGE_PL_2		(2 <<  7)	/* privilege level 2 (unused) */
 | |
| #define _PAGE_PL_3		(3 <<  7)	/* privilege level 3 (user) */
 | |
| #define _PAGE_PL_MASK		(3 <<  7)
 | |
| #define _PAGE_AR_R		(0 <<  9)	/* read only */
 | |
| #define _PAGE_AR_RX		(1 <<  9)	/* read & execute */
 | |
| #define _PAGE_AR_RW		(2 <<  9)	/* read & write */
 | |
| #define _PAGE_AR_RWX		(3 <<  9)	/* read, write & execute */
 | |
| #define _PAGE_AR_R_RW		(4 <<  9)	/* read / read & write */
 | |
| #define _PAGE_AR_RX_RWX		(5 <<  9)	/* read & exec / read, write & exec */
 | |
| #define _PAGE_AR_RWX_RW		(6 <<  9)	/* read, write & exec / read & write */
 | |
| #define _PAGE_AR_X_RX		(7 <<  9)	/* exec & promote / read & exec */
 | |
| #define _PAGE_AR_MASK		(7 <<  9)
 | |
| #define _PAGE_AR_SHIFT		9
 | |
| #define _PAGE_A			(1 << _PAGE_A_BIT)	/* page accessed bit */
 | |
| #define _PAGE_D			(1 << _PAGE_D_BIT)	/* page dirty bit */
 | |
| #define _PAGE_PPN_MASK		(((__IA64_UL(1) << IA64_MAX_PHYS_BITS) - 1) & ~0xfffUL)
 | |
| #define _PAGE_ED		(__IA64_UL(1) << 52)	/* exception deferral */
 | |
| #define _PAGE_PROTNONE		(__IA64_UL(1) << 63)
 | |
| 
 | |
| #define _PFN_MASK		_PAGE_PPN_MASK
 | |
| /* Mask of bits which may be changed by pte_modify(); the odd bits are there for _PAGE_PROTNONE */
 | |
| #define _PAGE_CHG_MASK	(_PAGE_P | _PAGE_PROTNONE | _PAGE_PL_MASK | _PAGE_AR_MASK | _PAGE_ED)
 | |
| 
 | |
| #define _PAGE_SIZE_4K	12
 | |
| #define _PAGE_SIZE_8K	13
 | |
| #define _PAGE_SIZE_16K	14
 | |
| #define _PAGE_SIZE_64K	16
 | |
| #define _PAGE_SIZE_256K	18
 | |
| #define _PAGE_SIZE_1M	20
 | |
| #define _PAGE_SIZE_4M	22
 | |
| #define _PAGE_SIZE_16M	24
 | |
| #define _PAGE_SIZE_64M	26
 | |
| #define _PAGE_SIZE_256M	28
 | |
| #define _PAGE_SIZE_1G	30
 | |
| #define _PAGE_SIZE_4G	32
 | |
| 
 | |
| /*
 | |
|  * Common PTE bit combinations used to build the PAGE_* protections.  Each
 | |
|  * replacement list is fully parenthesized so the macro behaves as a single
 | |
|  * operand when combined with operators that bind tighter than '|' (e.g. '&').
 | |
|  */
 | |
| #define __ACCESS_BITS		(_PAGE_ED | _PAGE_A | _PAGE_P | _PAGE_MA_WB)
 | |
| #define __DIRTY_BITS_NO_ED	(_PAGE_A | _PAGE_P | _PAGE_D | _PAGE_MA_WB)
 | |
| #define __DIRTY_BITS		(_PAGE_ED | __DIRTY_BITS_NO_ED)
 | |
| 
 | |
| /*
 | |
|  * How many pointers will a page table level hold expressed in shift
 | |
|  */
 | |
| #define PTRS_PER_PTD_SHIFT	(PAGE_SHIFT-3)
 | |
| 
 | |
| /*
 | |
|  * Definitions for fourth level:
 | |
|  */
 | |
| #define PTRS_PER_PTE	(__IA64_UL(1) << (PTRS_PER_PTD_SHIFT))
 | |
| 
 | |
| /*
 | |
|  * Definitions for third level:
 | |
|  *
 | |
|  * PMD_SHIFT determines the size of the area a third-level page table
 | |
|  * can map.
 | |
|  */
 | |
| #define PMD_SHIFT	(PAGE_SHIFT + (PTRS_PER_PTD_SHIFT))
 | |
| #define PMD_SIZE	(1UL << PMD_SHIFT)
 | |
| #define PMD_MASK	(~(PMD_SIZE-1))
 | |
| #define PTRS_PER_PMD	(1UL << (PTRS_PER_PTD_SHIFT))
 | |
| 
 | |
| #if CONFIG_PGTABLE_LEVELS == 4
 | |
| /*
 | |
|  * Definitions for second level:
 | |
|  *
 | |
|  * PUD_SHIFT determines the size of the area a second-level page table
 | |
|  * can map.
 | |
|  */
 | |
| #define PUD_SHIFT	(PMD_SHIFT + (PTRS_PER_PTD_SHIFT))
 | |
| #define PUD_SIZE	(1UL << PUD_SHIFT)
 | |
| #define PUD_MASK	(~(PUD_SIZE-1))
 | |
| #define PTRS_PER_PUD	(1UL << (PTRS_PER_PTD_SHIFT))
 | |
| #endif
 | |
| 
 | |
| /*
 | |
|  * Definitions for first level:
 | |
|  *
 | |
|  * PGDIR_SHIFT determines what a first-level page table entry can map.
 | |
|  */
 | |
| #if CONFIG_PGTABLE_LEVELS == 4
 | |
| #define PGDIR_SHIFT		(PUD_SHIFT + (PTRS_PER_PTD_SHIFT))
 | |
| #else
 | |
| #define PGDIR_SHIFT		(PMD_SHIFT + (PTRS_PER_PTD_SHIFT))
 | |
| #endif
 | |
| #define PGDIR_SIZE		(__IA64_UL(1) << PGDIR_SHIFT)
 | |
| #define PGDIR_MASK		(~(PGDIR_SIZE-1))
 | |
| #define PTRS_PER_PGD_SHIFT	PTRS_PER_PTD_SHIFT
 | |
| #define PTRS_PER_PGD		(1UL << PTRS_PER_PGD_SHIFT)
 | |
| #define USER_PTRS_PER_PGD	(5*PTRS_PER_PGD/8)	/* regions 0-4 are user regions */
 | |
| #define FIRST_USER_ADDRESS	0UL
 | |
| 
 | |
| /*
 | |
|  * All the normal masks have the "page accessed" bits on, as any time
 | |
|  * they are used, the page is accessed. They are cleared only by the
 | |
|  * page-out routines.
 | |
|  */
 | |
| #define PAGE_NONE	__pgprot(_PAGE_PROTNONE | _PAGE_A)
 | |
| #define PAGE_SHARED	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_RW)
 | |
| #define PAGE_READONLY	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_R)
 | |
| #define PAGE_COPY	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_R)
 | |
| #define PAGE_COPY_EXEC	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_RX)
 | |
| #define PAGE_GATE	__pgprot(__ACCESS_BITS | _PAGE_PL_0 | _PAGE_AR_X_RX)
 | |
| #define PAGE_KERNEL	__pgprot(__DIRTY_BITS  | _PAGE_PL_0 | _PAGE_AR_RWX)
 | |
| #define PAGE_KERNELRX	__pgprot(__ACCESS_BITS | _PAGE_PL_0 | _PAGE_AR_RX)
 | |
| #define PAGE_KERNEL_UC	__pgprot(__DIRTY_BITS  | _PAGE_PL_0 | _PAGE_AR_RWX | \
 | |
| 				 _PAGE_MA_UC)
 | |
| 
 | |
| # ifndef __ASSEMBLY__
 | |
| 
 | |
| #include <linux/sched.h>	/* for mm_struct */
 | |
| #include <linux/bitops.h>
 | |
| #include <asm/cacheflush.h>
 | |
| #include <asm/mmu_context.h>
 | |
| 
 | |
| /*
 | |
|  * Next come the mappings that determine how mmap() protection bits
 | |
|  * (PROT_EXEC, PROT_READ, PROT_WRITE, PROT_NONE) get implemented.  The
 | |
|  * _P version gets used for a private shared memory segment, the _S
 | |
|  * version gets used for a shared memory segment with MAP_SHARED on.
 | |
|  * In a private shared memory segment, we do a copy-on-write if a task
 | |
|  * attempts to write to the page.
 | |
|  */
 | |
| 	/* xwr */
 | |
| #define __P000	PAGE_NONE
 | |
| #define __P001	PAGE_READONLY
 | |
| #define __P010	PAGE_READONLY	/* write to priv pg -> copy & make writable */
 | |
| #define __P011	PAGE_READONLY	/* ditto */
 | |
| #define __P100	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_X_RX)
 | |
| #define __P101	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_RX)
 | |
| #define __P110	PAGE_COPY_EXEC
 | |
| #define __P111	PAGE_COPY_EXEC
 | |
| 
 | |
| #define __S000	PAGE_NONE
 | |
| #define __S001	PAGE_READONLY
 | |
| #define __S010	PAGE_SHARED	/* we don't have (and don't need) write-only */
 | |
| #define __S011	PAGE_SHARED
 | |
| #define __S100	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_X_RX)
 | |
| #define __S101	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_RX)
 | |
| #define __S110	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_RWX)
 | |
| #define __S111	__pgprot(__ACCESS_BITS | _PAGE_PL_3 | _PAGE_AR_RWX)
 | |
| 
 | |
| #define pgd_ERROR(e)	printk("%s:%d: bad pgd %016lx.\n", __FILE__, __LINE__, pgd_val(e))
 | |
| #if CONFIG_PGTABLE_LEVELS == 4
 | |
| #define pud_ERROR(e)	printk("%s:%d: bad pud %016lx.\n", __FILE__, __LINE__, pud_val(e))
 | |
| #endif
 | |
| #define pmd_ERROR(e)	printk("%s:%d: bad pmd %016lx.\n", __FILE__, __LINE__, pmd_val(e))
 | |
| #define pte_ERROR(e)	printk("%s:%d: bad pte %016lx.\n", __FILE__, __LINE__, pte_val(e))
 | |
| 
 | |
| 
 | |
| /*
 | |
|  * Some definitions to translate between mem_map, PTEs, and page addresses:
 | |
|  */
 | |
| 
 | |
| 
 | |
| /* Quick test to see if ADDR is a (potentially) valid physical address. */
 | |
| static inline long
 | |
| ia64_phys_addr_valid (unsigned long addr)
 | |
| {
 | |
| 	/* Any bit of ADDR inside the CPU's unimplemented-PA mask disqualifies it. */
 | |
| 	if (addr & local_cpu_data->unimpl_pa_mask)
 | |
| 		return 0;
 | |
| 
 | |
| 	return 1;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * kern_addr_valid(ADDR) tests if ADDR is pointing to valid kernel
 | |
|  * memory.  For the return value to be meaningful, ADDR must be >=
 | |
|  * PAGE_OFFSET.  This operation can be relatively expensive (e.g.,
 | |
|  * require a hash-, or multi-level tree-lookup or something of that
 | |
|  * sort) but it guarantees to return TRUE only if accessing the page
 | |
|  * at that address does not cause an error.  Note that there may be
 | |
|  * addresses for which kern_addr_valid() returns FALSE even though an
 | |
|  * access would not cause an error (e.g., this is typically true for
 | |
|  * memory mapped I/O regions).
 | |
|  *
 | |
|  * XXX Need to implement this for IA-64.
 | |
|  */
 | |
| #define kern_addr_valid(addr)	(1)
 | |
| 
 | |
| 
 | |
| /*
 | |
|  * Now come the defines and routines to manage and access the three-level
 | |
|  * page table.
 | |
|  */
 | |
| 
 | |
| 
 | |
| #define VMALLOC_START		(RGN_BASE(RGN_GATE) + 0x200000000UL)
 | |
| #ifdef CONFIG_VIRTUAL_MEM_MAP
 | |
| # define VMALLOC_END_INIT	(RGN_BASE(RGN_GATE) + (1UL << (4*PAGE_SHIFT - 9)))
 | |
| extern unsigned long VMALLOC_END;
 | |
| #else
 | |
| #if defined(CONFIG_SPARSEMEM) && defined(CONFIG_SPARSEMEM_VMEMMAP)
 | |
| /* SPARSEMEM_VMEMMAP uses half of vmalloc... */
 | |
| # define VMALLOC_END		(RGN_BASE(RGN_GATE) + (1UL << (4*PAGE_SHIFT - 10)))
 | |
| # define vmemmap		((struct page *)VMALLOC_END)
 | |
| #else
 | |
| # define VMALLOC_END		(RGN_BASE(RGN_GATE) + (1UL << (4*PAGE_SHIFT - 9)))
 | |
| #endif
 | |
| #endif
 | |
| 
 | |
| /* fs/proc/kcore.c */
 | |
| #define	kc_vaddr_to_offset(v) ((v) - RGN_BASE(RGN_GATE))
 | |
| #define	kc_offset_to_vaddr(o) ((o) + RGN_BASE(RGN_GATE))
 | |
| 
 | |
| #define RGN_MAP_SHIFT (PGDIR_SHIFT + PTRS_PER_PGD_SHIFT - 3)
 | |
| #define RGN_MAP_LIMIT	((1UL << RGN_MAP_SHIFT) - PAGE_SIZE)	/* per region addr limit */
 | |
| 
 | |
| /*
 | |
|  * Conversion functions: convert page frame number (pfn) and a protection value to a page
 | |
|  * table entry (pte).
 | |
|  */
 | |
| #define pfn_pte(pfn, pgprot) \
 | |
| ({ pte_t __pte; pte_val(__pte) = ((pfn) << PAGE_SHIFT) | pgprot_val(pgprot); __pte; })
 | |
| 
 | |
| /* Extract pfn from pte.  */
 | |
| #define pte_pfn(_pte)		((pte_val(_pte) & _PFN_MASK) >> PAGE_SHIFT)
 | |
| 
 | |
| #define mk_pte(page, pgprot)	pfn_pte(page_to_pfn(page), (pgprot))
 | |
| 
 | |
| /* This takes a physical page address that is used by the remapping functions */
 | |
| /*
 | |
|  * Build a pte from PHYSPAGE plus the bits of PGPROT.  PHYSPAGE is parenthesized
 | |
|  * in the expansion so that an expression argument is added as a single operand.
 | |
|  */
 | |
| #define mk_pte_phys(physpage, pgprot) \
 | |
| ({ pte_t __pte; pte_val(__pte) = (physpage) + pgprot_val(pgprot); __pte; })
 | |
| 
 | |
| #define pte_modify(_pte, newprot) \
 | |
| 	(__pte((pte_val(_pte) & ~_PAGE_CHG_MASK) | (pgprot_val(newprot) & _PAGE_CHG_MASK)))
 | |
| 
 | |
| #define pte_none(pte) 			(!pte_val(pte))
 | |
| #define pte_present(pte)		(pte_val(pte) & (_PAGE_P | _PAGE_PROTNONE))
 | |
| #define pte_clear(mm,addr,pte)		(pte_val(*(pte)) = 0UL)
 | |
| /* pte_page() returns the "struct page *" corresponding to the PTE: */
 | |
| #define pte_page(pte)			virt_to_page(((pte_val(pte) & _PFN_MASK) + PAGE_OFFSET))
 | |
| 
 | |
| #define pmd_none(pmd)			(!pmd_val(pmd))
 | |
| #define pmd_bad(pmd)			(!ia64_phys_addr_valid(pmd_val(pmd)))
 | |
| #define pmd_present(pmd)		(pmd_val(pmd) != 0UL)
 | |
| #define pmd_clear(pmdp)			(pmd_val(*(pmdp)) = 0UL)
 | |
| #define pmd_page_vaddr(pmd)		((unsigned long) __va(pmd_val(pmd) & _PFN_MASK))
 | |
| #define pmd_page(pmd)			virt_to_page((pmd_val(pmd) + PAGE_OFFSET))
 | |
| 
 | |
| #define pud_none(pud)			(!pud_val(pud))
 | |
| #define pud_bad(pud)			(!ia64_phys_addr_valid(pud_val(pud)))
 | |
| #define pud_present(pud)		(pud_val(pud) != 0UL)
 | |
| #define pud_clear(pudp)			(pud_val(*(pudp)) = 0UL)
 | |
| #define pud_page_vaddr(pud)		((unsigned long) __va(pud_val(pud) & _PFN_MASK))
 | |
| #define pud_page(pud)			virt_to_page((pud_val(pud) + PAGE_OFFSET))
 | |
| 
 | |
| #if CONFIG_PGTABLE_LEVELS == 4
 | |
| #define pgd_none(pgd)			(!pgd_val(pgd))
 | |
| #define pgd_bad(pgd)			(!ia64_phys_addr_valid(pgd_val(pgd)))
 | |
| #define pgd_present(pgd)		(pgd_val(pgd) != 0UL)
 | |
| #define pgd_clear(pgdp)			(pgd_val(*(pgdp)) = 0UL)
 | |
| #define pgd_page_vaddr(pgd)		((unsigned long) __va(pgd_val(pgd) & _PFN_MASK))
 | |
| #define pgd_page(pgd)			virt_to_page((pgd_val(pgd) + PAGE_OFFSET))
 | |
| #endif
 | |
| 
 | |
| /*
 | |
|  * The following have defined behavior only if pte_present() is true.
 | |
|  */
 | |
| #define pte_write(pte)	((unsigned) (((pte_val(pte) & _PAGE_AR_MASK) >> _PAGE_AR_SHIFT) - 2) <= 4)
 | |
| #define pte_exec(pte)		((pte_val(pte) & _PAGE_AR_RX) != 0)
 | |
| #define pte_dirty(pte)		((pte_val(pte) & _PAGE_D) != 0)
 | |
| #define pte_young(pte)		((pte_val(pte) & _PAGE_A) != 0)
 | |
| #define pte_special(pte)	0
 | |
| 
 | |
| /*
 | |
|  * Note: we convert AR_RWX to AR_RX and AR_RW to AR_R by clearing the 2nd bit in the
 | |
|  * access rights:
 | |
|  */
 | |
| #define pte_wrprotect(pte)	(__pte(pte_val(pte) & ~_PAGE_AR_RW))
 | |
| #define pte_mkwrite(pte)	(__pte(pte_val(pte) | _PAGE_AR_RW))
 | |
| #define pte_mkold(pte)		(__pte(pte_val(pte) & ~_PAGE_A))
 | |
| #define pte_mkyoung(pte)	(__pte(pte_val(pte) | _PAGE_A))
 | |
| #define pte_mkclean(pte)	(__pte(pte_val(pte) & ~_PAGE_D))
 | |
| #define pte_mkdirty(pte)	(__pte(pte_val(pte) | _PAGE_D))
 | |
| #define pte_mkhuge(pte)		(__pte(pte_val(pte)))
 | |
| #define pte_mkspecial(pte)	(pte)
 | |
| 
 | |
| /*
 | |
|  * Because ia64's Icache and Dcache are not coherent (on a cpu), we need to
 | |
|  * sync icache and dcache when we insert a *new* executable page.
 | |
|  *  __ia64_sync_icache_dcache() checks the PG_arch_1 bit and flushes the icache
 | |
|  * if necessary.
 | |
|  *
 | |
|  *  set_pte() is also called by the kernel, but we can expect that the kernel
 | |
|  *  flushes icache explicitly if necessary.
 | |
|  */
 | |
| #define pte_present_exec_user(pte)\
 | |
| 	((pte_val(pte) & (_PAGE_P | _PAGE_PL_MASK | _PAGE_AR_RX)) == \
 | |
| 		(_PAGE_P | _PAGE_PL_3 | _PAGE_AR_RX))
 | |
| 
 | |
| extern void __ia64_sync_icache_dcache(pte_t pteval);
 | |
| static inline void set_pte(pte_t *ptep, pte_t pteval)
 | |
| {
 | |
| 	/*
 | |
| 	 * The icache/dcache sync is requested only when the new PTE is present,
 | |
| 	 * user-level and executable, AND the slot either held no present PTE or
 | |
| 	 * referred to a different page frame (page swapin, new page, page
 | |
| 	 * migration, or copy-on-write with page copying).
 | |
| 	 *
 | |
| 	 * load_module() calls flush_icache_range() explicitly, so kernel
 | |
| 	 * mappings are not handled here.
 | |
| 	 */
 | |
| 	if (pte_present_exec_user(pteval)) {
 | |
| 		if (!pte_present(*ptep) || pte_pfn(*ptep) != pte_pfn(pteval))
 | |
| 			__ia64_sync_icache_dcache(pteval);
 | |
| 	}
 | |
| 
 | |
| 	/* Install the new entry in all cases. */
 | |
| 	*ptep = pteval;
 | |
| }
 | |
| 
 | |
| #define set_pte_at(mm,addr,ptep,pteval) set_pte(ptep,pteval)
 | |
| 
 | |
| /*
 | |
|  * Make page protection values cacheable, uncacheable, or write-
 | |
|  * combining.  Note that "protection" is really a misnomer here as the
 | |
|  * protection value contains the memory attribute bits, dirty bits, and
 | |
|  * various other bits as well.
 | |
|  */
 | |
| #define pgprot_cacheable(prot)		__pgprot((pgprot_val(prot) & ~_PAGE_MA_MASK) | _PAGE_MA_WB)
 | |
| #define pgprot_noncached(prot)		__pgprot((pgprot_val(prot) & ~_PAGE_MA_MASK) | _PAGE_MA_UC)
 | |
| #define pgprot_writecombine(prot)	__pgprot((pgprot_val(prot) & ~_PAGE_MA_MASK) | _PAGE_MA_WC)
 | |
| 
 | |
| struct file;
 | |
| extern pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
 | |
| 				     unsigned long size, pgprot_t vma_prot);
 | |
| #define __HAVE_PHYS_MEM_ACCESS_PROT
 | |
| 
 | |
| static inline unsigned long
 | |
| pgd_index (unsigned long address)
 | |
| {
 | |
| 	/* Address bits 61..63 select the region. */
 | |
| 	const unsigned long rgn = address >> 61;
 | |
| 	/* Index within the region's share of the PGD: 1/8 of PTRS_PER_PGD entries. */
 | |
| 	const unsigned long slot = (address >> PGDIR_SHIFT) & ((PTRS_PER_PGD >> 3) - 1);
 | |
| 
 | |
| 	/* Region number goes above the per-region index bits. */
 | |
| 	return slot | (rgn << (PAGE_SHIFT - 6));
 | |
| }
 | |
| 
 | |
| /* The offset in the 1-level directory is given by the 3 region bits
 | |
|    (61..63) and the level-1 bits.  */
 | |
| static inline pgd_t*
 | |
| pgd_offset (const struct mm_struct *mm, unsigned long address)
 | |
| {
 | |
| 	/* Entry of MM's top-level table selected by pgd_index(ADDRESS). */
 | |
| 	return &mm->pgd[pgd_index(address)];
 | |
| }
 | |
| 
 | |
| /* In the kernel's mapped region we completely ignore the region number
 | |
|    (since we know it's in region number 5). */
 | |
| #define pgd_offset_k(addr) \
 | |
| 	(init_mm.pgd + (((addr) >> PGDIR_SHIFT) & (PTRS_PER_PGD - 1)))
 | |
| 
 | |
| /* Look up a pgd entry in the gate area.  On IA-64, the gate-area
 | |
|    resides in the kernel-mapped segment, hence we use pgd_offset_k()
 | |
|    here.  */
 | |
| #define pgd_offset_gate(mm, addr)	pgd_offset_k(addr)
 | |
| 
 | |
| #if CONFIG_PGTABLE_LEVELS == 4
 | |
| /* Find an entry in the second-level page table.. */
 | |
| #define pud_offset(dir,addr) \
 | |
| 	((pud_t *) pgd_page_vaddr(*(dir)) + (((addr) >> PUD_SHIFT) & (PTRS_PER_PUD - 1)))
 | |
| #endif
 | |
| 
 | |
| /* Find an entry in the third-level page table.. */
 | |
| #define pmd_offset(dir,addr) \
 | |
| 	((pmd_t *) pud_page_vaddr(*(dir)) + (((addr) >> PMD_SHIFT) & (PTRS_PER_PMD - 1)))
 | |
| 
 | |
| /*
 | |
|  * Find an entry in the last-level (PTE) page table.  This looks more complicated than it
 | |
|  * should be because some platforms place page tables in high memory.
 | |
|  */
 | |
| #define pte_index(addr)	 	(((addr) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))
 | |
| #define pte_offset_kernel(dir,addr)	((pte_t *) pmd_page_vaddr(*(dir)) + pte_index(addr))
 | |
| #define pte_offset_map(dir,addr)	pte_offset_kernel(dir, addr)
 | |
| #define pte_unmap(pte)			do { } while (0)
 | |
| 
 | |
| /* atomic versions of some of the PTE manipulations: */
 | |
| 
 | |
| /*
 | |
|  * Clear the accessed bit of *PTEP.  Returns 0 without writing when the bit is
 | |
|  * already clear; otherwise returns the result of the clear operation (SMP) or
 | |
|  * 1 (UP).
 | |
|  */
 | |
| static inline int
 | |
| ptep_test_and_clear_young (struct vm_area_struct *vma, unsigned long addr, pte_t *ptep)
 | |
| {
 | |
| #ifdef CONFIG_SMP
 | |
| 	/* Plain read first; test_and_clear_bit() is used only when A is set. */
 | |
| 	if (pte_young(*ptep))
 | |
| 		return test_and_clear_bit(_PAGE_A_BIT, ptep);
 | |
| 	return 0;
 | |
| #else
 | |
| 	pte_t cur = *ptep;
 | |
| 
 | |
| 	if (pte_young(cur)) {
 | |
| 		set_pte_at(vma->vm_mm, addr, ptep, pte_mkold(cur));
 | |
| 		return 1;
 | |
| 	}
 | |
| 	return 0;
 | |
| #endif
 | |
| }
 | |
| 
 | |
| /* Zero *PTEP and return the value it held beforehand. */
 | |
| static inline pte_t
 | |
| ptep_get_and_clear(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
 | |
| {
 | |
| #ifdef CONFIG_SMP
 | |
| 	/* Exchange the entry with zero and wrap the previous raw value. */
 | |
| 	long prev = xchg((long *) ptep, 0);
 | |
| 
 | |
| 	return __pte(prev);
 | |
| #else
 | |
| 	pte_t prev = *ptep;
 | |
| 
 | |
| 	pte_clear(mm, addr, ptep);
 | |
| 	return prev;
 | |
| #endif
 | |
| }
 | |
| 
 | |
| /* Write-protect the PTE at PTEP by applying pte_wrprotect() to it in place. */
 | |
| static inline void
 | |
| ptep_set_wrprotect(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
 | |
| {
 | |
| #ifdef CONFIG_SMP
 | |
| 	unsigned long seen, wanted;
 | |
| 
 | |
| 	/* Retry until the entry is unchanged between the read and the cmpxchg. */
 | |
| 	for (;;) {
 | |
| 		seen = pte_val(*ptep);
 | |
| 		wanted = pte_val(pte_wrprotect(__pte (seen)));
 | |
| 		if (cmpxchg((unsigned long *) ptep, seen, wanted) == seen)
 | |
| 			break;
 | |
| 	}
 | |
| #else
 | |
| 	set_pte_at(mm, addr, ptep, pte_wrprotect(*ptep));
 | |
| #endif
 | |
| }
 | |
| 
 | |
| /* Returns 1 when A and B hold the same raw pte value, 0 otherwise. */
 | |
| static inline int
 | |
| pte_same (pte_t a, pte_t b)
 | |
| {
 | |
| 	if (pte_val(a) != pte_val(b))
 | |
| 		return 0;
 | |
| 
 | |
| 	return 1;
 | |
| }
 | |
| 
 | |
| #define update_mmu_cache(vma, address, ptep) do { } while (0)
 | |
| 
 | |
| extern pgd_t swapper_pg_dir[PTRS_PER_PGD];
 | |
| extern void paging_init (void);
 | |
| 
 | |
| /*
 | |
|  * Note: The macros below rely on the fact that MAX_SWAPFILES_SHIFT <= number of
 | |
|  *	 bits in the swap-type field of the swap pte.  It would be nice to
 | |
|  *	 enforce that, but we can't easily include <linux/swap.h> here.
 | |
|  *	 (Of course, better still would be to define MAX_SWAPFILES_SHIFT here...).
 | |
|  *
 | |
|  * Format of swap pte:
 | |
|  *	bit   0   : present bit (must be zero)
 | |
|  *	bits  1- 7: swap-type
 | |
|  *	bits  8-62: swap offset
 | |
|  *	bit  63   : _PAGE_PROTNONE bit
 | |
|  */
 | |
| #define __swp_type(entry)		(((entry).val >> 1) & 0x7f)
 | |
| #define __swp_offset(entry)		(((entry).val << 1) >> 9)
 | |
| #define __swp_entry(type,offset)	((swp_entry_t) { ((type) << 1) | ((long) (offset) << 8) })
 | |
| #define __pte_to_swp_entry(pte)		((swp_entry_t) { pte_val(pte) })
 | |
| #define __swp_entry_to_pte(x)		((pte_t) { (x).val })
 | |
| 
 | |
| /*
 | |
|  * ZERO_PAGE is a global shared page that is always zero: used
 | |
|  * for zero-mapped memory areas etc..
 | |
|  */
 | |
| extern unsigned long empty_zero_page[PAGE_SIZE/sizeof(unsigned long)];
 | |
| extern struct page *zero_page_memmap_ptr;
 | |
| #define ZERO_PAGE(vaddr) (zero_page_memmap_ptr)
 | |
| 
 | |
| /* We provide our own get_unmapped_area to cope with VA holes for userland */
 | |
| #define HAVE_ARCH_UNMAPPED_AREA
 | |
| 
 | |
| #ifdef CONFIG_HUGETLB_PAGE
 | |
| #define HUGETLB_PGDIR_SHIFT	(HPAGE_SHIFT + 2*(PAGE_SHIFT-3))
 | |
| #define HUGETLB_PGDIR_SIZE	(__IA64_UL(1) << HUGETLB_PGDIR_SHIFT)
 | |
| #define HUGETLB_PGDIR_MASK	(~(HUGETLB_PGDIR_SIZE-1))
 | |
| #endif
 | |
| 
 | |
| 
 | |
| #define __HAVE_ARCH_PTEP_SET_ACCESS_FLAGS
 | |
| /*
 | |
|  * Update PTEP with ENTRY, which is guaranteed to be a less
 | |
|  * restrictive PTE.  That is, ENTRY may have the ACCESSED, DIRTY, and
 | |
|  * WRITABLE bits turned on, when the value at PTEP did not.  The
 | |
|  * WRITABLE bit may only be turned on if SAFELY_WRITABLE is TRUE.
 | |
|  *
 | |
|  * SAFELY_WRITABLE is TRUE if we can update the value at PTEP without
 | |
|  * having to worry about races.  On SMP machines, there are only two
 | |
|  * cases where this is true:
 | |
|  *
 | |
|  *	(1) *PTEP has the PRESENT bit turned OFF
 | |
|  *	(2) ENTRY has the DIRTY bit turned ON
 | |
|  *
 | |
|  * On ia64, we could implement this routine with a cmpxchg()-loop
 | |
|  * which ORs in the _PAGE_A/_PAGE_D bit if they're set in ENTRY.
 | |
|  * However, like on x86, we can get a more streamlined version by
 | |
|  * observing that it is OK to drop ACCESSED bit updates when
 | |
|  * SAFELY_WRITABLE is FALSE.  Besides being rare, all that would do is
 | |
|  * result in an extra Access-bit fault, which would then turn on the
 | |
|  * ACCESSED bit in the low-level fault handler (iaccess_bit or
 | |
|  * daccess_bit in ivt.S).
 | |
|  */
 | |
| #ifdef CONFIG_SMP
 | |
| # define ptep_set_access_flags(__vma, __addr, __ptep, __entry, __safely_writable) \
 | |
| ({									\
 | |
| 	int __changed = !pte_same(*(__ptep), __entry);			\
 | |
| 	if (__changed && __safely_writable) {				\
 | |
| 		set_pte(__ptep, __entry);				\
 | |
| 		flush_tlb_page(__vma, __addr);				\
 | |
| 	}								\
 | |
| 	__changed;							\
 | |
| })
 | |
| #else
 | |
| # define ptep_set_access_flags(__vma, __addr, __ptep, __entry, __safely_writable) \
 | |
| ({									\
 | |
| 	int __changed = !pte_same(*(__ptep), __entry);			\
 | |
| 	if (__changed) {						\
 | |
| 		set_pte_at((__vma)->vm_mm, (__addr), __ptep, __entry);	\
 | |
| 		flush_tlb_page(__vma, __addr);				\
 | |
| 	}								\
 | |
| 	__changed;							\
 | |
| })
 | |
| #endif
 | |
| 
 | |
| #  ifdef CONFIG_VIRTUAL_MEM_MAP
 | |
|   /* arch mem_map init routine is needed due to holes in a virtual mem_map */
 | |
| #   define __HAVE_ARCH_MEMMAP_INIT
 | |
|     extern void memmap_init (unsigned long size, int nid, unsigned long zone,
 | |
| 			     unsigned long start_pfn);
 | |
| #  endif /* CONFIG_VIRTUAL_MEM_MAP */
 | |
| # endif /* !__ASSEMBLY__ */
 | |
| 
 | |
| /*
 | |
|  * Identity-mapped regions use a large page size.  We'll call such large pages
 | |
|  * "granules".  If you can think of a better name that's unambiguous, let me
 | |
|  * know...
 | |
|  */
 | |
| #if defined(CONFIG_IA64_GRANULE_64MB)
 | |
| # define IA64_GRANULE_SHIFT	_PAGE_SIZE_64M
 | |
| #elif defined(CONFIG_IA64_GRANULE_16MB)
 | |
| # define IA64_GRANULE_SHIFT	_PAGE_SIZE_16M
 | |
| #endif
 | |
| #define IA64_GRANULE_SIZE	(1 << IA64_GRANULE_SHIFT)
 | |
| /*
 | |
|  * log2() of the page size we use to map the kernel image (IA64_TR_KERNEL):
 | |
|  */
 | |
| #define KERNEL_TR_PAGE_SHIFT	_PAGE_SIZE_64M
 | |
| #define KERNEL_TR_PAGE_SIZE	(1 << KERNEL_TR_PAGE_SHIFT)
 | |
| 
 | |
| /*
 | |
|  * No page table caches to initialise
 | |
|  */
 | |
| #define pgtable_cache_init()	do { } while (0)
 | |
| 
 | |
| /* These tell get_user_pages() that the first gate page is accessible from user-level.  */
 | |
| #define FIXADDR_USER_START	GATE_ADDR
 | |
| #ifdef HAVE_BUGGY_SEGREL
 | |
| # define FIXADDR_USER_END	(GATE_ADDR + 2*PAGE_SIZE)
 | |
| #else
 | |
| # define FIXADDR_USER_END	(GATE_ADDR + 2*PERCPU_PAGE_SIZE)
 | |
| #endif
 | |
| 
 | |
| #define __HAVE_ARCH_PTEP_TEST_AND_CLEAR_YOUNG
 | |
| #define __HAVE_ARCH_PTEP_GET_AND_CLEAR
 | |
| #define __HAVE_ARCH_PTEP_SET_WRPROTECT
 | |
| #define __HAVE_ARCH_PTE_SAME
 | |
| #define __HAVE_ARCH_PGD_OFFSET_GATE
 | |
| 
 | |
| 
 | |
| #if CONFIG_PGTABLE_LEVELS == 3
 | |
| #include <asm-generic/pgtable-nopud.h>
 | |
| #endif
 | |
| #include <asm-generic/pgtable.h>
 | |
| 
 | |
| #endif /* _ASM_IA64_PGTABLE_H */
 |