Path: blob/master/arch/powerpc/include/asm/book3s/64/pgtable.h
51344 views
/* SPDX-License-Identifier: GPL-2.0 */1#ifndef _ASM_POWERPC_BOOK3S_64_PGTABLE_H_2#define _ASM_POWERPC_BOOK3S_64_PGTABLE_H_34#include <asm-generic/pgtable-nop4d.h>56#ifndef __ASSEMBLER__7#include <linux/mmdebug.h>8#include <linux/bug.h>9#include <linux/sizes.h>10#endif1112/*13* Common bits between hash and Radix page table14*/1516#define _PAGE_EXEC 0x00001 /* execute permission */17#define _PAGE_WRITE 0x00002 /* write access allowed */18#define _PAGE_READ 0x00004 /* read access allowed */19#define _PAGE_PRIVILEGED 0x00008 /* kernel access only */20#define _PAGE_SAO 0x00010 /* Strong access order */21#define _PAGE_NON_IDEMPOTENT 0x00020 /* non idempotent memory */22#define _PAGE_TOLERANT 0x00030 /* tolerant memory, cache inhibited */23#define _PAGE_DIRTY 0x00080 /* C: page changed */24#define _PAGE_ACCESSED 0x00100 /* R: page referenced */25/*26* Software bits27*/28#define _RPAGE_SW0 0x2000000000000000UL29#define _RPAGE_SW1 0x0080030#define _RPAGE_SW2 0x0040031#define _RPAGE_SW3 0x0020032#define _RPAGE_RSV1 0x00040UL3334#define _RPAGE_PKEY_BIT4 0x1000000000000000UL35#define _RPAGE_PKEY_BIT3 0x0800000000000000UL36#define _RPAGE_PKEY_BIT2 0x0400000000000000UL37#define _RPAGE_PKEY_BIT1 0x0200000000000000UL38#define _RPAGE_PKEY_BIT0 0x0100000000000000UL3940#define _PAGE_PTE 0x4000000000000000UL /* distinguishes PTEs from pointers */41#define _PAGE_PRESENT 0x8000000000000000UL /* pte contains a translation */42/*43* We need to mark a pmd pte invalid while splitting. We can do that by clearing44* the _PAGE_PRESENT bit. But then that will be taken as a swap pte. In order to45* differentiate between two use a SW field when invalidating.46*47* We do that temporary invalidate for regular pte entry in ptep_set_access_flags48*49* This is used only when _PAGE_PRESENT is cleared.50*/51#define _PAGE_INVALID _RPAGE_SW05253/*54* Top and bottom bits of RPN which can be used by hash55* translation mode, because we expect them to be zero56* otherwise.57*/58#define _RPAGE_RPN0 0x0100059#define _RPAGE_RPN1 0x0200060#define _RPAGE_RPN43 0x0080000000000000UL61#define _RPAGE_RPN42 0x0040000000000000UL62#define _RPAGE_RPN41 0x0020000000000000UL6364/* Max physical address bit as per radix table */65#define _RPAGE_PA_MAX 566667/*68* Max physical address bit we will use for now.69*70* This is mostly a hardware limitation and for now Power9 has71* a 51 bit limit.72*73* This is different from the number of physical bit required to address74* the last byte of memory. That is defined by MAX_PHYSMEM_BITS.75* MAX_PHYSMEM_BITS is a linux limitation imposed by the maximum76* number of sections we can support (SECTIONS_SHIFT).77*78* This is different from Radix page table limitation above and79* should always be less than that. The limit is done such that80* we can overload the bits between _RPAGE_PA_MAX and _PAGE_PA_MAX81* for hash linux page table specific bits.82*83* In order to be compatible with future hardware generations we keep84* some offsets and limit this for now to 5385*/86#define _PAGE_PA_MAX 538788#define _PAGE_SOFT_DIRTY _RPAGE_SW3 /* software: software dirty tracking */89#define _PAGE_SPECIAL _RPAGE_SW2 /* software: special page */9091/*92* Drivers request for cache inhibited pte mapping using _PAGE_NO_CACHE93* Instead of fixing all of them, add an alternate define which94* maps CI pte mapping.95*/96#define _PAGE_NO_CACHE _PAGE_TOLERANT97/*98* We support _RPAGE_PA_MAX bit real address in pte. On the linux side99* we are limited by _PAGE_PA_MAX. Clear everything above _PAGE_PA_MAX100* and every thing below PAGE_SHIFT;101*/102#define PTE_RPN_MASK (((1UL << _PAGE_PA_MAX) - 1) & (PAGE_MASK))103#define PTE_RPN_SHIFT PAGE_SHIFT104/*105* set of bits not changed in pmd_modify. Even though we have hash specific bits106* in here, on radix we expect them to be zero.107*/108#define _HPAGE_CHG_MASK (PTE_RPN_MASK | _PAGE_HPTEFLAGS | _PAGE_DIRTY | \109_PAGE_ACCESSED | H_PAGE_THP_HUGE | _PAGE_PTE | \110_PAGE_SOFT_DIRTY)111/*112* user access blocked by key113*/114#define _PAGE_KERNEL_RW (_PAGE_PRIVILEGED | _PAGE_RW | _PAGE_DIRTY)115#define _PAGE_KERNEL_RO (_PAGE_PRIVILEGED | _PAGE_READ)116#define _PAGE_KERNEL_ROX (_PAGE_PRIVILEGED | _PAGE_READ | _PAGE_EXEC)117#define _PAGE_KERNEL_RWX (_PAGE_PRIVILEGED | _PAGE_DIRTY | _PAGE_RW | _PAGE_EXEC)118/*119* _PAGE_CHG_MASK masks of bits that are to be preserved across120* pgprot changes121*/122#define _PAGE_CHG_MASK (PTE_RPN_MASK | _PAGE_HPTEFLAGS | _PAGE_DIRTY | \123_PAGE_ACCESSED | _PAGE_SPECIAL | _PAGE_PTE | \124_PAGE_SOFT_DIRTY)125126/*127* We define 2 sets of base prot bits, one for basic pages (ie,128* cacheable kernel and user pages) and one for non cacheable129* pages. We always set _PAGE_COHERENT when SMP is enabled or130* the processor might need it for DMA coherency.131*/132#define _PAGE_BASE_NC (_PAGE_PRESENT | _PAGE_ACCESSED)133#define _PAGE_BASE (_PAGE_BASE_NC)134135#include <asm/pgtable-masks.h>136137/* Permission masks used for kernel mappings */138#define PAGE_KERNEL __pgprot(_PAGE_BASE | _PAGE_KERNEL_RW)139#define PAGE_KERNEL_NC __pgprot(_PAGE_BASE_NC | _PAGE_KERNEL_RW | _PAGE_TOLERANT)140#define PAGE_KERNEL_NCG __pgprot(_PAGE_BASE_NC | _PAGE_KERNEL_RW | _PAGE_NON_IDEMPOTENT)141#define PAGE_KERNEL_X __pgprot(_PAGE_BASE | _PAGE_KERNEL_RWX)142#define PAGE_KERNEL_RO __pgprot(_PAGE_BASE | _PAGE_KERNEL_RO)143#define PAGE_KERNEL_ROX __pgprot(_PAGE_BASE | _PAGE_KERNEL_ROX)144145#ifndef __ASSEMBLER__146#include <linux/page_table_check.h>147148/*149* page table defines150*/151extern unsigned long __pte_index_size;152extern unsigned long __pmd_index_size;153extern unsigned long __pud_index_size;154extern unsigned long __pgd_index_size;155extern unsigned long __pud_cache_index;156#define PTE_INDEX_SIZE __pte_index_size157#define PMD_INDEX_SIZE __pmd_index_size158#define PUD_INDEX_SIZE __pud_index_size159#define PGD_INDEX_SIZE __pgd_index_size160/* pmd table use page table fragments */161#define PMD_CACHE_INDEX 0162#define PUD_CACHE_INDEX __pud_cache_index163/*164* Because of use of pte fragments and THP, size of page table165* are not always derived out of index size above.166*/167extern unsigned long __pte_table_size;168extern unsigned long __pmd_table_size;169extern unsigned long __pud_table_size;170extern unsigned long __pgd_table_size;171#define PTE_TABLE_SIZE __pte_table_size172#define PMD_TABLE_SIZE __pmd_table_size173#define PUD_TABLE_SIZE __pud_table_size174#define PGD_TABLE_SIZE __pgd_table_size175176extern unsigned long __pmd_val_bits;177extern unsigned long __pud_val_bits;178extern unsigned long __pgd_val_bits;179#define PMD_VAL_BITS __pmd_val_bits180#define PUD_VAL_BITS __pud_val_bits181#define PGD_VAL_BITS __pgd_val_bits182183extern unsigned long __pte_frag_nr;184#define PTE_FRAG_NR __pte_frag_nr185extern unsigned long __pte_frag_size_shift;186#define PTE_FRAG_SIZE_SHIFT __pte_frag_size_shift187#define PTE_FRAG_SIZE (1UL << PTE_FRAG_SIZE_SHIFT)188189extern unsigned long __pmd_frag_nr;190#define PMD_FRAG_NR __pmd_frag_nr191extern unsigned long __pmd_frag_size_shift;192#define PMD_FRAG_SIZE_SHIFT __pmd_frag_size_shift193#define PMD_FRAG_SIZE (1UL << PMD_FRAG_SIZE_SHIFT)194195#define PTRS_PER_PTE (1 << PTE_INDEX_SIZE)196#define PTRS_PER_PMD (1 << PMD_INDEX_SIZE)197#define PTRS_PER_PUD (1 << PUD_INDEX_SIZE)198#define PTRS_PER_PGD (1 << PGD_INDEX_SIZE)199200#define MAX_PTRS_PER_PTE ((H_PTRS_PER_PTE > R_PTRS_PER_PTE) ? H_PTRS_PER_PTE : R_PTRS_PER_PTE)201#define MAX_PTRS_PER_PMD ((H_PTRS_PER_PMD > R_PTRS_PER_PMD) ? H_PTRS_PER_PMD : R_PTRS_PER_PMD)202#define MAX_PTRS_PER_PUD ((H_PTRS_PER_PUD > R_PTRS_PER_PUD) ? H_PTRS_PER_PUD : R_PTRS_PER_PUD)203#define MAX_PTRS_PER_PGD (1 << (H_PGD_INDEX_SIZE > RADIX_PGD_INDEX_SIZE ? \204H_PGD_INDEX_SIZE : RADIX_PGD_INDEX_SIZE))205206/* PMD_SHIFT determines what a second-level page table entry can map */207#define PMD_SHIFT (PAGE_SHIFT + PTE_INDEX_SIZE)208#define PMD_SIZE (1UL << PMD_SHIFT)209#define PMD_MASK (~(PMD_SIZE-1))210211/* PUD_SHIFT determines what a third-level page table entry can map */212#define PUD_SHIFT (PMD_SHIFT + PMD_INDEX_SIZE)213#define PUD_SIZE (1UL << PUD_SHIFT)214#define PUD_MASK (~(PUD_SIZE-1))215216/* PGDIR_SHIFT determines what a fourth-level page table entry can map */217#define PGDIR_SHIFT (PUD_SHIFT + PUD_INDEX_SIZE)218#define PGDIR_SIZE (1UL << PGDIR_SHIFT)219#define PGDIR_MASK (~(PGDIR_SIZE-1))220221/* Bits to mask out from a PMD to get to the PTE page */222#define PMD_MASKED_BITS 0xc0000000000000ffUL223/* Bits to mask out from a PUD to get to the PMD page */224#define PUD_MASKED_BITS 0xc0000000000000ffUL225/* Bits to mask out from a PGD to get to the PUD page */226#define P4D_MASKED_BITS 0xc0000000000000ffUL227228/*229* Used as an indicator for rcu callback functions230*/231enum pgtable_index {232PTE_INDEX = 0,233PMD_INDEX,234PUD_INDEX,235PGD_INDEX,236/*237* Below are used with 4k page size and hugetlb238*/239HTLB_16M_INDEX,240HTLB_16G_INDEX,241};242243extern unsigned long __vmalloc_start;244extern unsigned long __vmalloc_end;245#define VMALLOC_START __vmalloc_start246#define VMALLOC_END __vmalloc_end247248static inline unsigned int ioremap_max_order(void)249{250if (radix_enabled())251return PUD_SHIFT;252return 7 + PAGE_SHIFT; /* default from linux/vmalloc.h */253}254#define IOREMAP_MAX_ORDER ioremap_max_order()255256extern unsigned long __kernel_virt_start;257extern unsigned long __kernel_io_start;258extern unsigned long __kernel_io_end;259#define KERN_VIRT_START __kernel_virt_start260#define KERN_IO_START __kernel_io_start261#define KERN_IO_END __kernel_io_end262263extern struct page *vmemmap;264extern unsigned long pci_io_base;265266#define pmd_leaf pmd_leaf267static inline bool pmd_leaf(pmd_t pmd)268{269return !!(pmd_raw(pmd) & cpu_to_be64(_PAGE_PTE));270}271272#define pud_leaf pud_leaf273static inline bool pud_leaf(pud_t pud)274{275return !!(pud_raw(pud) & cpu_to_be64(_PAGE_PTE));276}277278#define pmd_leaf_size pmd_leaf_size279static inline unsigned long pmd_leaf_size(pmd_t pmd)280{281if (IS_ENABLED(CONFIG_PPC_4K_PAGES) && !radix_enabled())282return SZ_16M;283else284return PMD_SIZE;285}286287#define pud_leaf_size pud_leaf_size288static inline unsigned long pud_leaf_size(pud_t pud)289{290if (IS_ENABLED(CONFIG_PPC_4K_PAGES) && !radix_enabled())291return SZ_16G;292else293return PUD_SIZE;294}295#endif /* __ASSEMBLER__ */296297#include <asm/book3s/64/hash.h>298#include <asm/book3s/64/radix.h>299300#if H_MAX_PHYSMEM_BITS > R_MAX_PHYSMEM_BITS301#define MAX_PHYSMEM_BITS H_MAX_PHYSMEM_BITS302#else303#define MAX_PHYSMEM_BITS R_MAX_PHYSMEM_BITS304#endif305306/* hash 4k can't share hugetlb and also doesn't support THP */307#ifdef CONFIG_PPC_64K_PAGES308#include <asm/book3s/64/pgtable-64k.h>309#endif310311#include <asm/barrier.h>312/*313* IO space itself carved into the PIO region (ISA and PHB IO space) and314* the ioremap space315*316* ISA_IO_BASE = KERN_IO_START, 64K reserved area317* PHB_IO_BASE = ISA_IO_BASE + 64K to ISA_IO_BASE + 2G, PHB IO spaces318* IOREMAP_BASE = ISA_IO_BASE + 2G to VMALLOC_START + PGTABLE_RANGE319*/320#define FULL_IO_SIZE 0x80000000ul321#define ISA_IO_BASE (KERN_IO_START)322#define ISA_IO_END (KERN_IO_START + 0x10000ul)323#define PHB_IO_BASE (ISA_IO_END)324#define PHB_IO_END (KERN_IO_START + FULL_IO_SIZE)325#define IOREMAP_BASE (PHB_IO_END)326#define IOREMAP_START (ioremap_bot)327#define IOREMAP_END (KERN_IO_END - FIXADDR_SIZE)328#define FIXADDR_SIZE SZ_32M329#define FIXADDR_TOP (IOREMAP_END + FIXADDR_SIZE)330331#ifndef __ASSEMBLER__332333static inline unsigned long pte_update(struct mm_struct *mm, unsigned long addr,334pte_t *ptep, unsigned long clr,335unsigned long set, int huge)336{337if (radix_enabled())338return radix__pte_update(mm, addr, ptep, clr, set, huge);339return hash__pte_update(mm, addr, ptep, clr, set, huge);340}341/*342* For hash even if we have _PAGE_ACCESSED = 0, we do a pte_update.343* We currently remove entries from the hashtable regardless of whether344* the entry was young or dirty.345*346* We should be more intelligent about this but for the moment we override347* these functions and force a tlb flush unconditionally348* For radix: H_PAGE_HASHPTE should be zero. Hence we can use the same349* function for both hash and radix.350*/351static inline int __ptep_test_and_clear_young(struct mm_struct *mm,352unsigned long addr, pte_t *ptep)353{354unsigned long old;355356if ((pte_raw(*ptep) & cpu_to_be64(_PAGE_ACCESSED | H_PAGE_HASHPTE)) == 0)357return 0;358old = pte_update(mm, addr, ptep, _PAGE_ACCESSED, 0, 0);359return (old & _PAGE_ACCESSED) != 0;360}361362#define __HAVE_ARCH_PTEP_TEST_AND_CLEAR_YOUNG363#define ptep_test_and_clear_young(__vma, __addr, __ptep) \364({ \365__ptep_test_and_clear_young((__vma)->vm_mm, __addr, __ptep); \366})367368/*369* On Book3S CPUs, clearing the accessed bit without a TLB flush370* doesn't cause data corruption. [ It could cause incorrect371* page aging and the (mistaken) reclaim of hot pages, but the372* chance of that should be relatively low. ]373*374* So as a performance optimization don't flush the TLB when375* clearing the accessed bit, it will eventually be flushed by376* a context switch or a VM operation anyway. [ In the rare377* event of it not getting flushed for a long time the delay378* shouldn't really matter because there's no real memory379* pressure for swapout to react to. ]380*381* Note: this optimisation also exists in pte_needs_flush() and382* huge_pmd_needs_flush().383*/384#define __HAVE_ARCH_PTEP_CLEAR_YOUNG_FLUSH385#define ptep_clear_flush_young ptep_test_and_clear_young386387#define __HAVE_ARCH_PMDP_CLEAR_YOUNG_FLUSH388#define pmdp_clear_flush_young pmdp_test_and_clear_young389390static inline int pte_write(pte_t pte)391{392return !!(pte_raw(pte) & cpu_to_be64(_PAGE_WRITE));393}394395static inline int pte_read(pte_t pte)396{397return !!(pte_raw(pte) & cpu_to_be64(_PAGE_READ));398}399400#define __HAVE_ARCH_PTEP_SET_WRPROTECT401static inline void ptep_set_wrprotect(struct mm_struct *mm, unsigned long addr,402pte_t *ptep)403{404if (pte_write(*ptep))405pte_update(mm, addr, ptep, _PAGE_WRITE, 0, 0);406}407408#define __HAVE_ARCH_HUGE_PTEP_SET_WRPROTECT409static inline void huge_ptep_set_wrprotect(struct mm_struct *mm,410unsigned long addr, pte_t *ptep)411{412if (pte_write(*ptep))413pte_update(mm, addr, ptep, _PAGE_WRITE, 0, 1);414}415416#define __HAVE_ARCH_PTEP_GET_AND_CLEAR417static inline pte_t ptep_get_and_clear(struct mm_struct *mm,418unsigned long addr, pte_t *ptep)419{420pte_t old_pte = __pte(pte_update(mm, addr, ptep, ~0UL, 0, 0));421422page_table_check_pte_clear(mm, addr, old_pte);423424return old_pte;425}426427#define __HAVE_ARCH_PTEP_GET_AND_CLEAR_FULL428static inline pte_t ptep_get_and_clear_full(struct mm_struct *mm,429unsigned long addr,430pte_t *ptep, int full)431{432if (full && radix_enabled()) {433pte_t old_pte;434435/*436* We know that this is a full mm pte clear and437* hence can be sure there is no parallel set_pte.438*/439old_pte = radix__ptep_get_and_clear_full(mm, addr, ptep, full);440page_table_check_pte_clear(mm, addr, old_pte);441442return old_pte;443}444return ptep_get_and_clear(mm, addr, ptep);445}446447448static inline void pte_clear(struct mm_struct *mm, unsigned long addr,449pte_t * ptep)450{451pte_update(mm, addr, ptep, ~0UL, 0, 0);452}453454static inline int pte_dirty(pte_t pte)455{456return !!(pte_raw(pte) & cpu_to_be64(_PAGE_DIRTY));457}458459static inline int pte_young(pte_t pte)460{461return !!(pte_raw(pte) & cpu_to_be64(_PAGE_ACCESSED));462}463464static inline int pte_special(pte_t pte)465{466return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SPECIAL));467}468469static inline bool pte_exec(pte_t pte)470{471return !!(pte_raw(pte) & cpu_to_be64(_PAGE_EXEC));472}473474475#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY476static inline bool pte_soft_dirty(pte_t pte)477{478return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SOFT_DIRTY));479}480481static inline pte_t pte_mksoft_dirty(pte_t pte)482{483return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_SOFT_DIRTY));484}485486static inline pte_t pte_clear_soft_dirty(pte_t pte)487{488return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_SOFT_DIRTY));489}490#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */491492#ifdef CONFIG_NUMA_BALANCING493static inline int pte_protnone(pte_t pte)494{495return (pte_raw(pte) & cpu_to_be64(_PAGE_PRESENT | _PAGE_PTE | _PAGE_RWX)) ==496cpu_to_be64(_PAGE_PRESENT | _PAGE_PTE);497}498#endif /* CONFIG_NUMA_BALANCING */499500static inline bool pte_hw_valid(pte_t pte)501{502return (pte_raw(pte) & cpu_to_be64(_PAGE_PRESENT | _PAGE_PTE)) ==503cpu_to_be64(_PAGE_PRESENT | _PAGE_PTE);504}505506static inline int pte_present(pte_t pte)507{508/*509* A pte is considerent present if _PAGE_PRESENT is set.510* We also need to consider the pte present which is marked511* invalid during ptep_set_access_flags. Hence we look for _PAGE_INVALID512* if we find _PAGE_PRESENT cleared.513*/514515if (pte_hw_valid(pte))516return true;517return (pte_raw(pte) & cpu_to_be64(_PAGE_INVALID | _PAGE_PTE)) ==518cpu_to_be64(_PAGE_INVALID | _PAGE_PTE);519}520521#ifdef CONFIG_PPC_MEM_KEYS522extern bool arch_pte_access_permitted(u64 pte, bool write, bool execute);523#else524static inline bool arch_pte_access_permitted(u64 pte, bool write, bool execute)525{526return true;527}528#endif /* CONFIG_PPC_MEM_KEYS */529530static inline bool pte_user(pte_t pte)531{532return !(pte_raw(pte) & cpu_to_be64(_PAGE_PRIVILEGED));533}534535#define pte_access_permitted pte_access_permitted536static inline bool pte_access_permitted(pte_t pte, bool write)537{538/*539* _PAGE_READ is needed for any access and will be cleared for540* PROT_NONE. Execute-only mapping via PROT_EXEC also returns false.541*/542if (!pte_present(pte) || !pte_user(pte) || !pte_read(pte))543return false;544545if (write && !pte_write(pte))546return false;547548return arch_pte_access_permitted(pte_val(pte), write, 0);549}550551static inline bool pte_user_accessible_page(pte_t pte, unsigned long addr)552{553return pte_present(pte) && pte_user(pte);554}555556/*557* Conversion functions: convert a page and protection to a page entry,558* and a page entry and page directory to the page they refer to.559*560* Even if PTEs can be unsigned long long, a PFN is always an unsigned561* long for now.562*/563static inline pte_t pfn_pte(unsigned long pfn, pgprot_t pgprot)564{565VM_BUG_ON(pfn >> (64 - PAGE_SHIFT));566VM_BUG_ON((pfn << PAGE_SHIFT) & ~PTE_RPN_MASK);567568return __pte(((pte_basic_t)pfn << PAGE_SHIFT) | pgprot_val(pgprot) | _PAGE_PTE);569}570571/* Generic modifiers for PTE bits */572static inline pte_t pte_wrprotect(pte_t pte)573{574return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_WRITE));575}576577static inline pte_t pte_exprotect(pte_t pte)578{579return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_EXEC));580}581582static inline pte_t pte_mkclean(pte_t pte)583{584return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_DIRTY));585}586587static inline pte_t pte_mkold(pte_t pte)588{589return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_ACCESSED));590}591592static inline pte_t pte_mkexec(pte_t pte)593{594return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_EXEC));595}596597static inline pte_t pte_mkwrite_novma(pte_t pte)598{599/*600* write implies read, hence set both601*/602return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_RW));603}604605static inline pte_t pte_mkdirty(pte_t pte)606{607return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_DIRTY | _PAGE_SOFT_DIRTY));608}609610static inline pte_t pte_mkyoung(pte_t pte)611{612return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_ACCESSED));613}614615static inline pte_t pte_mkspecial(pte_t pte)616{617return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_SPECIAL));618}619620static inline pte_t pte_mkhuge(pte_t pte)621{622return pte;623}624625static inline pte_t pte_modify(pte_t pte, pgprot_t newprot)626{627/* FIXME!! check whether this need to be a conditional */628return __pte_raw((pte_raw(pte) & cpu_to_be64(_PAGE_CHG_MASK)) |629cpu_to_be64(pgprot_val(newprot)));630}631632/* Encode and de-code a swap entry */633#define MAX_SWAPFILES_CHECK() do { \634BUILD_BUG_ON(MAX_SWAPFILES_SHIFT > SWP_TYPE_BITS); \635/* \636* Don't have overlapping bits with _PAGE_HPTEFLAGS \637* We filter HPTEFLAGS on set_pte. \638*/ \639BUILD_BUG_ON(_PAGE_HPTEFLAGS & SWP_TYPE_MASK); \640BUILD_BUG_ON(_PAGE_HPTEFLAGS & _PAGE_SWP_SOFT_DIRTY); \641BUILD_BUG_ON(_PAGE_HPTEFLAGS & _PAGE_SWP_EXCLUSIVE); \642} while (0)643644#define SWP_TYPE_BITS 5645#define SWP_TYPE_MASK ((1UL << SWP_TYPE_BITS) - 1)646#define __swp_type(x) ((x).val & SWP_TYPE_MASK)647#define __swp_offset(x) (((x).val & PTE_RPN_MASK) >> PAGE_SHIFT)648#define __swp_entry(type, offset) ((swp_entry_t) { \649(type) | (((offset) << PAGE_SHIFT) & PTE_RPN_MASK)})650/*651* swp_entry_t must be independent of pte bits. We build a swp_entry_t from652* swap type and offset we get from swap and convert that to pte to find a653* matching pte in linux page table.654* Clear bits not found in swap entries here.655*/656#define __pte_to_swp_entry(pte) ((swp_entry_t) { pte_val((pte)) & ~_PAGE_PTE })657#define __swp_entry_to_pte(x) __pte((x).val | _PAGE_PTE)658#define __pmd_to_swp_entry(pmd) (__pte_to_swp_entry(pmd_pte(pmd)))659#define __swp_entry_to_pmd(x) (pte_pmd(__swp_entry_to_pte(x)))660661#ifdef CONFIG_MEM_SOFT_DIRTY662#define _PAGE_SWP_SOFT_DIRTY _PAGE_SOFT_DIRTY663#else664#define _PAGE_SWP_SOFT_DIRTY 0UL665#endif /* CONFIG_MEM_SOFT_DIRTY */666667#define _PAGE_SWP_EXCLUSIVE _PAGE_NON_IDEMPOTENT668669#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY670static inline pte_t pte_swp_mksoft_dirty(pte_t pte)671{672return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_SWP_SOFT_DIRTY));673}674675static inline bool pte_swp_soft_dirty(pte_t pte)676{677return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SWP_SOFT_DIRTY));678}679680static inline pte_t pte_swp_clear_soft_dirty(pte_t pte)681{682return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_SWP_SOFT_DIRTY));683}684#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */685686static inline pte_t pte_swp_mkexclusive(pte_t pte)687{688return __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_SWP_EXCLUSIVE));689}690691static inline bool pte_swp_exclusive(pte_t pte)692{693return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SWP_EXCLUSIVE));694}695696static inline pte_t pte_swp_clear_exclusive(pte_t pte)697{698return __pte_raw(pte_raw(pte) & cpu_to_be64(~_PAGE_SWP_EXCLUSIVE));699}700701static inline bool check_pte_access(unsigned long access, unsigned long ptev)702{703/*704* This check for _PAGE_RWX and _PAGE_PRESENT bits705*/706if (access & ~ptev)707return false;708/*709* This check for access to privilege space710*/711if ((access & _PAGE_PRIVILEGED) != (ptev & _PAGE_PRIVILEGED))712return false;713714return true;715}716/*717* Generic functions with hash/radix callbacks718*/719720static inline void __ptep_set_access_flags(struct vm_area_struct *vma,721pte_t *ptep, pte_t entry,722unsigned long address,723int psize)724{725if (radix_enabled())726return radix__ptep_set_access_flags(vma, ptep, entry,727address, psize);728return hash__ptep_set_access_flags(ptep, entry);729}730731#define __HAVE_ARCH_PTE_SAME732static inline int pte_same(pte_t pte_a, pte_t pte_b)733{734if (radix_enabled())735return radix__pte_same(pte_a, pte_b);736return hash__pte_same(pte_a, pte_b);737}738739static inline int pte_none(pte_t pte)740{741if (radix_enabled())742return radix__pte_none(pte);743return hash__pte_none(pte);744}745746static inline void __set_pte_at(struct mm_struct *mm, unsigned long addr,747pte_t *ptep, pte_t pte, int percpu)748{749750VM_WARN_ON(!(pte_raw(pte) & cpu_to_be64(_PAGE_PTE)));751/*752* Keep the _PAGE_PTE added till we are sure we handle _PAGE_PTE753* in all the callers.754*/755pte = __pte_raw(pte_raw(pte) | cpu_to_be64(_PAGE_PTE));756757if (radix_enabled())758return radix__set_pte_at(mm, addr, ptep, pte, percpu);759return hash__set_pte_at(mm, addr, ptep, pte, percpu);760}761762#define _PAGE_CACHE_CTL (_PAGE_SAO | _PAGE_NON_IDEMPOTENT | _PAGE_TOLERANT)763764#define pgprot_noncached pgprot_noncached765static inline pgprot_t pgprot_noncached(pgprot_t prot)766{767return __pgprot((pgprot_val(prot) & ~_PAGE_CACHE_CTL) |768_PAGE_NON_IDEMPOTENT);769}770771#define pgprot_noncached_wc pgprot_noncached_wc772static inline pgprot_t pgprot_noncached_wc(pgprot_t prot)773{774return __pgprot((pgprot_val(prot) & ~_PAGE_CACHE_CTL) |775_PAGE_TOLERANT);776}777778#define pgprot_cached pgprot_cached779static inline pgprot_t pgprot_cached(pgprot_t prot)780{781return __pgprot((pgprot_val(prot) & ~_PAGE_CACHE_CTL));782}783784#define pgprot_writecombine pgprot_writecombine785static inline pgprot_t pgprot_writecombine(pgprot_t prot)786{787return pgprot_noncached_wc(prot);788}789/*790* check a pte mapping have cache inhibited property791*/792static inline bool pte_ci(pte_t pte)793{794__be64 pte_v = pte_raw(pte);795796if (((pte_v & cpu_to_be64(_PAGE_CACHE_CTL)) == cpu_to_be64(_PAGE_TOLERANT)) ||797((pte_v & cpu_to_be64(_PAGE_CACHE_CTL)) == cpu_to_be64(_PAGE_NON_IDEMPOTENT)))798return true;799return false;800}801802static inline void pmd_clear(pmd_t *pmdp)803{804if (IS_ENABLED(CONFIG_DEBUG_VM) && !radix_enabled()) {805/*806* Don't use this if we can possibly have a hash page table807* entry mapping this.808*/809WARN_ON((pmd_val(*pmdp) & (H_PAGE_HASHPTE | _PAGE_PTE)) == (H_PAGE_HASHPTE | _PAGE_PTE));810}811*pmdp = __pmd(0);812}813814static inline int pmd_none(pmd_t pmd)815{816return !pmd_raw(pmd);817}818819static inline int pmd_present(pmd_t pmd)820{821/*822* A pmd is considerent present if _PAGE_PRESENT is set.823* We also need to consider the pmd present which is marked824* invalid during a split. Hence we look for _PAGE_INVALID825* if we find _PAGE_PRESENT cleared.826*/827if (pmd_raw(pmd) & cpu_to_be64(_PAGE_PRESENT | _PAGE_INVALID))828return true;829830return false;831}832833static inline int pmd_is_serializing(pmd_t pmd)834{835/*836* If the pmd is undergoing a split, the _PAGE_PRESENT bit is clear837* and _PAGE_INVALID is set (see pmd_present, pmdp_invalidate).838*839* This condition may also occur when flushing a pmd while flushing840* it (see ptep_modify_prot_start), so callers must ensure this841* case is fine as well.842*/843if ((pmd_raw(pmd) & cpu_to_be64(_PAGE_PRESENT | _PAGE_INVALID)) ==844cpu_to_be64(_PAGE_INVALID))845return true;846847return false;848}849850static inline int pmd_bad(pmd_t pmd)851{852if (radix_enabled())853return radix__pmd_bad(pmd);854return hash__pmd_bad(pmd);855}856857static inline void pud_clear(pud_t *pudp)858{859if (IS_ENABLED(CONFIG_DEBUG_VM) && !radix_enabled()) {860/*861* Don't use this if we can possibly have a hash page table862* entry mapping this.863*/864WARN_ON((pud_val(*pudp) & (H_PAGE_HASHPTE | _PAGE_PTE)) == (H_PAGE_HASHPTE | _PAGE_PTE));865}866*pudp = __pud(0);867}868869static inline int pud_none(pud_t pud)870{871return !pud_raw(pud);872}873874static inline int pud_present(pud_t pud)875{876return !!(pud_raw(pud) & cpu_to_be64(_PAGE_PRESENT));877}878879extern struct page *pud_page(pud_t pud);880extern struct page *pmd_page(pmd_t pmd);881static inline pte_t pud_pte(pud_t pud)882{883return __pte_raw(pud_raw(pud));884}885886static inline pud_t pte_pud(pte_t pte)887{888return __pud_raw(pte_raw(pte));889}890891static inline pte_t *pudp_ptep(pud_t *pud)892{893return (pte_t *)pud;894}895896#define pud_pfn(pud) pte_pfn(pud_pte(pud))897#define pud_dirty(pud) pte_dirty(pud_pte(pud))898#define pud_young(pud) pte_young(pud_pte(pud))899#define pud_mkold(pud) pte_pud(pte_mkold(pud_pte(pud)))900#define pud_wrprotect(pud) pte_pud(pte_wrprotect(pud_pte(pud)))901#define pud_mkdirty(pud) pte_pud(pte_mkdirty(pud_pte(pud)))902#define pud_mkclean(pud) pte_pud(pte_mkclean(pud_pte(pud)))903#define pud_mkyoung(pud) pte_pud(pte_mkyoung(pud_pte(pud)))904#define pud_mkwrite(pud) pte_pud(pte_mkwrite_novma(pud_pte(pud)))905#define pud_write(pud) pte_write(pud_pte(pud))906907#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY908#define pud_soft_dirty(pmd) pte_soft_dirty(pud_pte(pud))909#define pud_mksoft_dirty(pmd) pte_pud(pte_mksoft_dirty(pud_pte(pud)))910#define pud_clear_soft_dirty(pmd) pte_pud(pte_clear_soft_dirty(pud_pte(pud)))911#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */912913static inline int pud_bad(pud_t pud)914{915if (radix_enabled())916return radix__pud_bad(pud);917return hash__pud_bad(pud);918}919920#define pud_access_permitted pud_access_permitted921static inline bool pud_access_permitted(pud_t pud, bool write)922{923return pte_access_permitted(pud_pte(pud), write);924}925926#define pud_user_accessible_page pud_user_accessible_page927static inline bool pud_user_accessible_page(pud_t pud, unsigned long addr)928{929return pud_leaf(pud) && pte_user_accessible_page(pud_pte(pud), addr);930}931932#define __p4d_raw(x) ((p4d_t) { __pgd_raw(x) })933static inline __be64 p4d_raw(p4d_t x)934{935return pgd_raw(x.pgd);936}937938#define p4d_write(p4d) pte_write(p4d_pte(p4d))939940static inline void p4d_clear(p4d_t *p4dp)941{942*p4dp = __p4d(0);943}944945static inline int p4d_none(p4d_t p4d)946{947return !p4d_raw(p4d);948}949950static inline int p4d_present(p4d_t p4d)951{952return !!(p4d_raw(p4d) & cpu_to_be64(_PAGE_PRESENT));953}954955static inline pte_t p4d_pte(p4d_t p4d)956{957return __pte_raw(p4d_raw(p4d));958}959960static inline p4d_t pte_p4d(pte_t pte)961{962return __p4d_raw(pte_raw(pte));963}964965static inline int p4d_bad(p4d_t p4d)966{967if (radix_enabled())968return radix__p4d_bad(p4d);969return hash__p4d_bad(p4d);970}971972#define p4d_access_permitted p4d_access_permitted973static inline bool p4d_access_permitted(p4d_t p4d, bool write)974{975return pte_access_permitted(p4d_pte(p4d), write);976}977978extern struct page *p4d_page(p4d_t p4d);979980/* Pointers in the page table tree are physical addresses */981#define __pgtable_ptr_val(ptr) __pa(ptr)982983static inline pud_t *p4d_pgtable(p4d_t p4d)984{985return (pud_t *)__va(p4d_val(p4d) & ~P4D_MASKED_BITS);986}987988static inline pmd_t *pud_pgtable(pud_t pud)989{990return (pmd_t *)__va(pud_val(pud) & ~PUD_MASKED_BITS);991}992993#define pmd_ERROR(e) \994pr_err("%s:%d: bad pmd %08lx.\n", __FILE__, __LINE__, pmd_val(e))995#define pud_ERROR(e) \996pr_err("%s:%d: bad pud %08lx.\n", __FILE__, __LINE__, pud_val(e))997#define pgd_ERROR(e) \998pr_err("%s:%d: bad pgd %08lx.\n", __FILE__, __LINE__, pgd_val(e))9991000static inline int map_kernel_page(unsigned long ea, unsigned long pa, pgprot_t prot)1001{1002if (radix_enabled()) {1003#if defined(CONFIG_PPC_RADIX_MMU) && defined(DEBUG_VM)1004unsigned long page_size = 1 << mmu_psize_defs[mmu_io_psize].shift;1005WARN((page_size != PAGE_SIZE), "I/O page size != PAGE_SIZE");1006#endif1007return radix__map_kernel_page(ea, pa, prot, PAGE_SIZE);1008}1009return hash__map_kernel_page(ea, pa, prot);1010}10111012void unmap_kernel_page(unsigned long va);10131014static inline int __meminit vmemmap_create_mapping(unsigned long start,1015unsigned long page_size,1016unsigned long phys)1017{1018if (radix_enabled())1019return radix__vmemmap_create_mapping(start, page_size, phys);1020return hash__vmemmap_create_mapping(start, page_size, phys);1021}10221023#ifdef CONFIG_MEMORY_HOTPLUG1024static inline void vmemmap_remove_mapping(unsigned long start,1025unsigned long page_size)1026{1027if (radix_enabled())1028return radix__vmemmap_remove_mapping(start, page_size);1029return hash__vmemmap_remove_mapping(start, page_size);1030}1031#endif10321033static inline pte_t pmd_pte(pmd_t pmd)1034{1035return __pte_raw(pmd_raw(pmd));1036}10371038static inline pmd_t pte_pmd(pte_t pte)1039{1040return __pmd_raw(pte_raw(pte));1041}10421043static inline pte_t *pmdp_ptep(pmd_t *pmd)1044{1045return (pte_t *)pmd;1046}1047#define pmd_pfn(pmd) pte_pfn(pmd_pte(pmd))1048#define pmd_dirty(pmd) pte_dirty(pmd_pte(pmd))1049#define pmd_young(pmd) pte_young(pmd_pte(pmd))1050#define pmd_mkold(pmd) pte_pmd(pte_mkold(pmd_pte(pmd)))1051#define pmd_wrprotect(pmd) pte_pmd(pte_wrprotect(pmd_pte(pmd)))1052#define pmd_mkdirty(pmd) pte_pmd(pte_mkdirty(pmd_pte(pmd)))1053#define pmd_mkclean(pmd) pte_pmd(pte_mkclean(pmd_pte(pmd)))1054#define pmd_mkyoung(pmd) pte_pmd(pte_mkyoung(pmd_pte(pmd)))1055#define pmd_mkwrite_novma(pmd) pte_pmd(pte_mkwrite_novma(pmd_pte(pmd)))10561057#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY1058#define pmd_soft_dirty(pmd) pte_soft_dirty(pmd_pte(pmd))1059#define pmd_mksoft_dirty(pmd) pte_pmd(pte_mksoft_dirty(pmd_pte(pmd)))1060#define pmd_clear_soft_dirty(pmd) pte_pmd(pte_clear_soft_dirty(pmd_pte(pmd)))10611062#ifdef CONFIG_ARCH_ENABLE_THP_MIGRATION1063#define pmd_swp_mksoft_dirty(pmd) pte_pmd(pte_swp_mksoft_dirty(pmd_pte(pmd)))1064#define pmd_swp_soft_dirty(pmd) pte_swp_soft_dirty(pmd_pte(pmd))1065#define pmd_swp_clear_soft_dirty(pmd) pte_pmd(pte_swp_clear_soft_dirty(pmd_pte(pmd)))1066#endif1067#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */10681069#ifdef CONFIG_NUMA_BALANCING1070static inline int pmd_protnone(pmd_t pmd)1071{1072return pte_protnone(pmd_pte(pmd));1073}1074#endif /* CONFIG_NUMA_BALANCING */10751076#define pmd_write(pmd) pte_write(pmd_pte(pmd))10771078#define pmd_access_permitted pmd_access_permitted1079static inline bool pmd_access_permitted(pmd_t pmd, bool write)1080{1081/*1082* pmdp_invalidate sets this combination (which is not caught by1083* !pte_present() check in pte_access_permitted), to prevent1084* lock-free lookups, as part of the serialize_against_pte_lookup()1085* synchronisation.1086*1087* This also catches the case where the PTE's hardware PRESENT bit is1088* cleared while TLB is flushed, which is suboptimal but should not1089* be frequent.1090*/1091if (pmd_is_serializing(pmd))1092return false;10931094return pte_access_permitted(pmd_pte(pmd), write);1095}10961097#define pmd_user_accessible_page pmd_user_accessible_page1098static inline bool pmd_user_accessible_page(pmd_t pmd, unsigned long addr)1099{1100return pmd_leaf(pmd) && pte_user_accessible_page(pmd_pte(pmd), addr);1101}11021103#ifdef CONFIG_TRANSPARENT_HUGEPAGE1104extern pmd_t pfn_pmd(unsigned long pfn, pgprot_t pgprot);1105extern pud_t pfn_pud(unsigned long pfn, pgprot_t pgprot);1106extern pmd_t pmd_modify(pmd_t pmd, pgprot_t newprot);1107extern pud_t pud_modify(pud_t pud, pgprot_t newprot);1108extern void set_pmd_at(struct mm_struct *mm, unsigned long addr,1109pmd_t *pmdp, pmd_t pmd);1110extern void set_pud_at(struct mm_struct *mm, unsigned long addr,1111pud_t *pudp, pud_t pud);11121113static inline void update_mmu_cache_pmd(struct vm_area_struct *vma,1114unsigned long addr, pmd_t *pmd)1115{1116}11171118static inline void update_mmu_cache_pud(struct vm_area_struct *vma,1119unsigned long addr, pud_t *pud)1120{1121}11221123extern int hash__has_transparent_hugepage(void);1124static inline int has_transparent_hugepage(void)1125{1126if (radix_enabled())1127return radix__has_transparent_hugepage();1128return hash__has_transparent_hugepage();1129}1130#define has_transparent_hugepage has_transparent_hugepage11311132static inline int has_transparent_pud_hugepage(void)1133{1134if (radix_enabled())1135return radix__has_transparent_pud_hugepage();1136return 0;1137}1138#define has_transparent_pud_hugepage has_transparent_pud_hugepage11391140static inline unsigned long1141pmd_hugepage_update(struct mm_struct *mm, unsigned long addr, pmd_t *pmdp,1142unsigned long clr, unsigned long set)1143{1144if (radix_enabled())1145return radix__pmd_hugepage_update(mm, addr, pmdp, clr, set);1146return hash__pmd_hugepage_update(mm, addr, pmdp, clr, set);1147}11481149static inline unsigned long1150pud_hugepage_update(struct mm_struct *mm, unsigned long addr, pud_t *pudp,1151unsigned long clr, unsigned long set)1152{1153if (radix_enabled())1154return radix__pud_hugepage_update(mm, addr, pudp, clr, set);1155BUG();1156return pud_val(*pudp);1157}11581159/*1160* For radix we should always find H_PAGE_HASHPTE zero. Hence1161* the below will work for radix too1162*/1163static inline int __pmdp_test_and_clear_young(struct mm_struct *mm,1164unsigned long addr, pmd_t *pmdp)1165{1166unsigned long old;11671168if ((pmd_raw(*pmdp) & cpu_to_be64(_PAGE_ACCESSED | H_PAGE_HASHPTE)) == 0)1169return 0;1170old = pmd_hugepage_update(mm, addr, pmdp, _PAGE_ACCESSED, 0);1171return ((old & _PAGE_ACCESSED) != 0);1172}11731174static inline int __pudp_test_and_clear_young(struct mm_struct *mm,1175unsigned long addr, pud_t *pudp)1176{1177unsigned long old;11781179if ((pud_raw(*pudp) & cpu_to_be64(_PAGE_ACCESSED | H_PAGE_HASHPTE)) == 0)1180return 0;1181old = pud_hugepage_update(mm, addr, pudp, _PAGE_ACCESSED, 0);1182return ((old & _PAGE_ACCESSED) != 0);1183}11841185#define __HAVE_ARCH_PMDP_SET_WRPROTECT1186static inline void pmdp_set_wrprotect(struct mm_struct *mm, unsigned long addr,1187pmd_t *pmdp)1188{1189if (pmd_write(*pmdp))1190pmd_hugepage_update(mm, addr, pmdp, _PAGE_WRITE, 0);1191}11921193#define __HAVE_ARCH_PUDP_SET_WRPROTECT1194static inline void pudp_set_wrprotect(struct mm_struct *mm, unsigned long addr,1195pud_t *pudp)1196{1197if (pud_write(*pudp))1198pud_hugepage_update(mm, addr, pudp, _PAGE_WRITE, 0);1199}12001201/*1202* Only returns true for a THP. False for pmd migration entry.1203* We also need to return true when we come across a pte that1204* in between a thp split. While splitting THP, we mark the pmd1205* invalid (pmdp_invalidate()) before we set it with pte page1206* address. A pmd_trans_huge() check against a pmd entry during that time1207* should return true.1208* We should not call this on a hugetlb entry. We should check for HugeTLB1209* entry using vma->vm_flags1210* The page table walk rule is explained in Documentation/mm/transhuge.rst1211*/1212static inline int pmd_trans_huge(pmd_t pmd)1213{1214if (!pmd_present(pmd))1215return false;12161217if (radix_enabled())1218return radix__pmd_trans_huge(pmd);1219return hash__pmd_trans_huge(pmd);1220}12211222static inline int pud_trans_huge(pud_t pud)1223{1224if (!pud_present(pud))1225return false;12261227if (radix_enabled())1228return radix__pud_trans_huge(pud);1229return 0;1230}123112321233#define __HAVE_ARCH_PMD_SAME1234static inline int pmd_same(pmd_t pmd_a, pmd_t pmd_b)1235{1236if (radix_enabled())1237return radix__pmd_same(pmd_a, pmd_b);1238return hash__pmd_same(pmd_a, pmd_b);1239}12401241#define pud_same pud_same1242static inline int pud_same(pud_t pud_a, pud_t pud_b)1243{1244if (radix_enabled())1245return radix__pud_same(pud_a, pud_b);1246return hash__pud_same(pud_a, pud_b);1247}124812491250static inline pmd_t __pmd_mkhuge(pmd_t pmd)1251{1252if (radix_enabled())1253return radix__pmd_mkhuge(pmd);1254return hash__pmd_mkhuge(pmd);1255}12561257static inline pud_t __pud_mkhuge(pud_t pud)1258{1259if (radix_enabled())1260return radix__pud_mkhuge(pud);1261BUG();1262return pud;1263}12641265/*1266* pfn_pmd return a pmd_t that can be used as pmd pte entry.1267*/1268static inline pmd_t pmd_mkhuge(pmd_t pmd)1269{1270#ifdef CONFIG_DEBUG_VM1271if (radix_enabled())1272WARN_ON((pmd_raw(pmd) & cpu_to_be64(_PAGE_PTE)) == 0);1273else1274WARN_ON((pmd_raw(pmd) & cpu_to_be64(_PAGE_PTE | H_PAGE_THP_HUGE)) !=1275cpu_to_be64(_PAGE_PTE | H_PAGE_THP_HUGE));1276#endif1277return pmd;1278}12791280static inline pud_t pud_mkhuge(pud_t pud)1281{1282#ifdef CONFIG_DEBUG_VM1283if (radix_enabled())1284WARN_ON((pud_raw(pud) & cpu_to_be64(_PAGE_PTE)) == 0);1285else1286WARN_ON(1);1287#endif1288return pud;1289}129012911292#define __HAVE_ARCH_PMDP_SET_ACCESS_FLAGS1293extern int pmdp_set_access_flags(struct vm_area_struct *vma,1294unsigned long address, pmd_t *pmdp,1295pmd_t entry, int dirty);1296#define __HAVE_ARCH_PUDP_SET_ACCESS_FLAGS1297extern int pudp_set_access_flags(struct vm_area_struct *vma,1298unsigned long address, pud_t *pudp,1299pud_t entry, int dirty);13001301#define __HAVE_ARCH_PMDP_TEST_AND_CLEAR_YOUNG1302extern int pmdp_test_and_clear_young(struct vm_area_struct *vma,1303unsigned long address, pmd_t *pmdp);1304#define __HAVE_ARCH_PUDP_TEST_AND_CLEAR_YOUNG1305extern int pudp_test_and_clear_young(struct vm_area_struct *vma,1306unsigned long address, pud_t *pudp);130713081309#define __HAVE_ARCH_PMDP_HUGE_GET_AND_CLEAR1310static inline pmd_t pmdp_huge_get_and_clear(struct mm_struct *mm,1311unsigned long addr, pmd_t *pmdp)1312{1313pmd_t old_pmd;13141315if (radix_enabled()) {1316old_pmd = radix__pmdp_huge_get_and_clear(mm, addr, pmdp);1317} else {1318old_pmd = hash__pmdp_huge_get_and_clear(mm, addr, pmdp);1319}13201321page_table_check_pmd_clear(mm, addr, old_pmd);13221323return old_pmd;1324}13251326#define __HAVE_ARCH_PUDP_HUGE_GET_AND_CLEAR1327static inline pud_t pudp_huge_get_and_clear(struct mm_struct *mm,1328unsigned long addr, pud_t *pudp)1329{1330pud_t old_pud;13311332if (radix_enabled()) {1333old_pud = radix__pudp_huge_get_and_clear(mm, addr, pudp);1334} else {1335BUG();1336}13371338page_table_check_pud_clear(mm, addr, old_pud);13391340return old_pud;1341}13421343static inline pmd_t pmdp_collapse_flush(struct vm_area_struct *vma,1344unsigned long address, pmd_t *pmdp)1345{1346if (radix_enabled())1347return radix__pmdp_collapse_flush(vma, address, pmdp);1348return hash__pmdp_collapse_flush(vma, address, pmdp);1349}1350#define pmdp_collapse_flush pmdp_collapse_flush13511352#define __HAVE_ARCH_PMDP_HUGE_GET_AND_CLEAR_FULL1353pmd_t pmdp_huge_get_and_clear_full(struct vm_area_struct *vma,1354unsigned long addr,1355pmd_t *pmdp, int full);13561357#define __HAVE_ARCH_PUDP_HUGE_GET_AND_CLEAR_FULL1358pud_t pudp_huge_get_and_clear_full(struct vm_area_struct *vma,1359unsigned long addr,1360pud_t *pudp, int full);13611362#define __HAVE_ARCH_PGTABLE_DEPOSIT1363static inline void pgtable_trans_huge_deposit(struct mm_struct *mm,1364pmd_t *pmdp, pgtable_t pgtable)1365{1366if (radix_enabled())1367return radix__pgtable_trans_huge_deposit(mm, pmdp, pgtable);1368return hash__pgtable_trans_huge_deposit(mm, pmdp, pgtable);1369}13701371#define __HAVE_ARCH_PGTABLE_WITHDRAW1372static inline pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm,1373pmd_t *pmdp)1374{1375if (radix_enabled())1376return radix__pgtable_trans_huge_withdraw(mm, pmdp);1377return hash__pgtable_trans_huge_withdraw(mm, pmdp);1378}13791380#define __HAVE_ARCH_PMDP_INVALIDATE1381extern pmd_t pmdp_invalidate(struct vm_area_struct *vma, unsigned long address,1382pmd_t *pmdp);1383extern pud_t pudp_invalidate(struct vm_area_struct *vma, unsigned long address,1384pud_t *pudp);13851386#define pmd_move_must_withdraw pmd_move_must_withdraw1387struct spinlock;1388extern int pmd_move_must_withdraw(struct spinlock *new_pmd_ptl,1389struct spinlock *old_pmd_ptl,1390struct vm_area_struct *vma);1391/*1392* Hash translation mode use the deposited table to store hash pte1393* slot information.1394*/1395#define arch_needs_pgtable_deposit arch_needs_pgtable_deposit1396static inline bool arch_needs_pgtable_deposit(void)1397{1398if (radix_enabled())1399return false;1400return true;1401}1402extern void serialize_against_pte_lookup(struct mm_struct *mm);14031404#endif /* CONFIG_TRANSPARENT_HUGEPAGE */14051406#define __HAVE_ARCH_PTEP_MODIFY_PROT_TRANSACTION1407pte_t ptep_modify_prot_start(struct vm_area_struct *, unsigned long, pte_t *);1408void ptep_modify_prot_commit(struct vm_area_struct *, unsigned long,1409pte_t *, pte_t, pte_t);14101411/*1412* Returns true for a R -> RW upgrade of pte1413*/1414static inline bool is_pte_rw_upgrade(unsigned long old_val, unsigned long new_val)1415{1416if (!(old_val & _PAGE_READ))1417return false;14181419if ((!(old_val & _PAGE_WRITE)) && (new_val & _PAGE_WRITE))1420return true;14211422return false;1423}14241425#endif /* __ASSEMBLER__ */1426#endif /* _ASM_POWERPC_BOOK3S_64_PGTABLE_H_ */142714281429