arch/x86/mm/pageattr.c

   1 /*
   2  * Copyright 2002 Andi Kleen, SuSE Labs.
   3  * Thanks to Ben LaHaise for precious feedback.
   4  */
   5 #include <linux/highmem.h>
   6 #include <linux/bootmem.h>
   7 #include <linux/module.h>
   8 #include <linux/sched.h>
   9 #include <linux/slab.h>
  10 #include <linux/mm.h>
  11 #include <linux/interrupt.h>
  12
  13 #include <asm/e820.h>
  14 #include <asm/processor.h>
  15 #include <asm/tlbflush.h>
  16 #include <asm/sections.h>
  17 #include <asm/uaccess.h>
  18 #include <asm/pgalloc.h>
  19
  20 /*
  21  * The current flushing context - we pass it instead of 5 arguments:
  22  */
  23 struct cpa_data {
  24         unsigned long   vaddr;
  25         pgprot_t        mask_set;
  26         pgprot_t        mask_clr;
  27         int             numpages;
  28         int             flushtlb;
  29 };
  30
  31 static inline int
  32 within(unsigned long addr, unsigned long start, unsigned long end)
  33 {
  34         return addr >= start && addr < end;
  35 }
  36
  37 /*
  38  * Flushing functions
  39  */
  40
  41 /**
  42  * clflush_cache_range - flush a cache range with clflush
  43  * @addr:       virtual start address
  44  * @size:       number of bytes to flush
  45  *
  46  * clflush is an unordered instruction which needs fencing with mfence
  47  * to avoid ordering issues.
  48  */
  49 void clflush_cache_range(void *vaddr, unsigned int size)
  50 {
  51         void *vend = vaddr + size - 1;
  52
  53         mb();
  54
  55         for (; vaddr < vend; vaddr += boot_cpu_data.x86_clflush_size)
  56                 clflush(vaddr);
  57         /*
  58          * Flush any possible final partial cacheline:
  59          */
  60         clflush(vend);
  61
  62         mb();
  63 }
  64
  65 static void __cpa_flush_all(void *arg)
  66 {
  67         unsigned long cache = (unsigned long)arg;
  68
  69         /*
  70          * Flush all to work around Errata in early athlons regarding
  71          * large page flushing.
  72          */
  73         __flush_tlb_all();
  74
  75         if (cache && boot_cpu_data.x86_model >= 4)
  76                 wbinvd();
  77 }
  78
  79 static void cpa_flush_all(unsigned long cache)
  80 {
  81         BUG_ON(irqs_disabled());
  82
  83         on_each_cpu(__cpa_flush_all, (void *) cache, 1, 1);
  84 }
  85
  86 static void __cpa_flush_range(void *arg)
  87 {
  88         /*
  89          * We could optimize that further and do individual per page
  90          * tlb invalidates for a low number of pages. Caveat: we must
  91          * flush the high aliases on 64bit as well.
  92          */
  93         __flush_tlb_all();
  94 }
  95
  96 static void cpa_flush_range(unsigned long start, int numpages, int cache)
  97 {
  98         unsigned int i, level;
  99         unsigned long addr;
 100
 101         BUG_ON(irqs_disabled());
 102         WARN_ON(PAGE_ALIGN(start) != start);
 103
 104         on_each_cpu(__cpa_flush_range, NULL, 1, 1);
 105
 106         if (!cache)
 107                 return;
 108
 109         /*
 110          * We only need to flush on one CPU,
 111          * clflush is a MESI-coherent instruction that
 112          * will cause all other CPUs to flush the same
 113          * cachelines:
 114          */
 115         for (i = 0, addr = start; i < numpages; i++, addr += PAGE_SIZE) {
 116                 pte_t *pte = lookup_address(addr, &level);
 117
 118                 /*
 119                  * Only flush present addresses:
 120                  */
 121                 if (pte && (pte_val(*pte) & _PAGE_PRESENT))
 122                         clflush_cache_range((void *) addr, PAGE_SIZE);
 123         }
 124 }
 125
 126 #define HIGH_MAP_START  __START_KERNEL_map
 127 #define HIGH_MAP_END    (__START_KERNEL_map + KERNEL_TEXT_SIZE)
 128
 129
 130 /*
 131  * Converts a virtual address to a X86-64 highmap address
 132  */
 133 static unsigned long virt_to_highmap(void *address)
 134 {
 135 #ifdef CONFIG_X86_64
 136         return __pa((unsigned long)address) + HIGH_MAP_START - phys_base;
 137 #else
 138         return (unsigned long)address;
 139 #endif
 140 }
 141
 142 /*
 143  * Certain areas of memory on x86 require very specific protection flags,
 144  * for example the BIOS area or kernel text. Callers don't always get this
 145  * right (again, ioremap() on BIOS memory is not uncommon) so this function
 146  * checks and fixes these known static required protection bits.
 147  */
 148 static inline pgprot_t static_protections(pgprot_t prot, unsigned long address)
 149 {
 150         pgprot_t forbidden = __pgprot(0);
 151
 152         /*
 153          * The BIOS area between 640k and 1Mb needs to be executable for
 154          * PCI BIOS based config access (CONFIG_PCI_GOBIOS) support.
 155          */
 156         if (within(__pa(address), BIOS_BEGIN, BIOS_END))
 157                 pgprot_val(forbidden) |= _PAGE_NX;
 158
 159         /*
 160          * The kernel text needs to be executable for obvious reasons
 161          * Does not cover __inittext since that is gone later on
 162          */
 163         if (within(address, (unsigned long)_text, (unsigned long)_etext))
 164                 pgprot_val(forbidden) |= _PAGE_NX;
 165         /*
 166          * Do the same for the x86-64 high kernel mapping
 167          */
 168         if (within(address, virt_to_highmap(_text), virt_to_highmap(_etext)))
 169                 pgprot_val(forbidden) |= _PAGE_NX;
 170
 171         /* The .rodata section needs to be read-only */
 172         if (within(address, (unsigned long)__start_rodata,
 173                                 (unsigned long)__end_rodata))
 174                 pgprot_val(forbidden) |= _PAGE_RW;
 175         /*
 176          * Do the same for the x86-64 high kernel mapping
 177          */
 178         if (within(address, virt_to_highmap(__start_rodata),
 179                                 virt_to_highmap(__end_rodata)))
 180                 pgprot_val(forbidden) |= _PAGE_RW;
 181
 182         prot = __pgprot(pgprot_val(prot) & ~pgprot_val(forbidden));
 183
 184         return prot;
 185 }
 186
 187 /*
 188  * Lookup the page table entry for a virtual address. Return a pointer
 189  * to the entry and the level of the mapping.
 190  *
 191  * Note: We return pud and pmd either when the entry is marked large
 192  * or when the present bit is not set. Otherwise we would return a
 193  * pointer to a nonexisting mapping.
 194  */
 195 pte_t *lookup_address(unsigned long address, unsigned int *level)
 196 {
 197         pgd_t *pgd = pgd_offset_k(address);
 198         pud_t *pud;
 199         pmd_t *pmd;
 200
 201         *level = PG_LEVEL_NONE;
 202
 203         if (pgd_none(*pgd))
 204                 return NULL;
 205
 206         pud = pud_offset(pgd, address);
 207         if (pud_none(*pud))
 208                 return NULL;
 209
 210         *level = PG_LEVEL_1G;
 211         if (pud_large(*pud) || !pud_present(*pud))
 212                 return (pte_t *)pud;
 213
 214         pmd = pmd_offset(pud, address);
 215         if (pmd_none(*pmd))
 216                 return NULL;
 217
 218         *level = PG_LEVEL_2M;
 219         if (pmd_large(*pmd) || !pmd_present(*pmd))
 220                 return (pte_t *)pmd;
 221
 222         *level = PG_LEVEL_4K;
 223
 224         return pte_offset_kernel(pmd, address);
 225 }
 226
 227 /*
 228  * Set the new pmd in all the pgds we know about:
 229  */
 230 static void __set_pmd_pte(pte_t *kpte, unsigned long address, pte_t pte)
 231 {
 232         /* change init_mm */
 233         set_pte_atomic(kpte, pte);
 234 #ifdef CONFIG_X86_32
 235         if (!SHARED_KERNEL_PMD) {
 236                 struct page *page;
 237
 238                 list_for_each_entry(page, &pgd_list, lru) {
 239                         pgd_t *pgd;
 240                         pud_t *pud;
 241                         pmd_t *pmd;
 242
 243                         pgd = (pgd_t *)page_address(page) + pgd_index(address);
 244                         pud = pud_offset(pgd, address);
 245                         pmd = pmd_offset(pud, address);
 246                         set_pte_atomic((pte_t *)pmd, pte);
 247                 }
 248         }
 249 #endif
 250 }
 251
 252 static int
 253 try_preserve_large_page(pte_t *kpte, unsigned long address,
 254                         struct cpa_data *cpa)
 255 {
 256         unsigned long nextpage_addr, numpages, pmask, psize, flags;
 257         pte_t new_pte, old_pte, *tmp;
 258         pgprot_t old_prot, new_prot;
 259         int do_split = 1;
 260         unsigned int level;
 261
 262         spin_lock_irqsave(&pgd_lock, flags);
 263         /*
 264          * Check for races, another CPU might have split this page
 265          * up already:
 266          */
 267         tmp = lookup_address(address, &level);
 268         if (tmp != kpte)
 269                 goto out_unlock;
 270
 271         switch (level) {
 272         case PG_LEVEL_2M:
 273                 psize = PMD_PAGE_SIZE;
 274                 pmask = PMD_PAGE_MASK;
 275                 break;
 276 #ifdef CONFIG_X86_64
 277         case PG_LEVEL_1G:
 278                 psize = PMD_PAGE_SIZE;
 279                 pmask = PMD_PAGE_MASK;
 280                 break;
 281 #endif
 282         default:
 283                 do_split = -EINVAL;
 284                 goto out_unlock;
 285         }
 286
 287         /*
 288          * Calculate the number of pages, which fit into this large
 289          * page starting at address:
 290          */
 291         nextpage_addr = (address + psize) & pmask;
 292         numpages = (nextpage_addr - address) >> PAGE_SHIFT;
 293         if (numpages < cpa->numpages)
 294                 cpa->numpages = numpages;
 295
 296         /*
 297          * We are safe now. Check whether the new pgprot is the same:
 298          */
 299         old_pte = *kpte;
 300         old_prot = new_prot = pte_pgprot(old_pte);
 301
 302         pgprot_val(new_prot) &= ~pgprot_val(cpa->mask_clr);
 303         pgprot_val(new_prot) |= pgprot_val(cpa->mask_set);
 304         new_prot = static_protections(new_prot, address);
 305
 306         /*
 307          * If there are no changes, return. maxpages has been updated
 308          * above:
 309          */
 310         if (pgprot_val(new_prot) == pgprot_val(old_prot)) {
 311                 do_split = 0;
 312                 goto out_unlock;
 313         }
 314
 315         /*
 316          * We need to change the attributes. Check, whether we can
 317          * change the large page in one go. We request a split, when
 318          * the address is not aligned and the number of pages is
 319          * smaller than the number of pages in the large page. Note
 320          * that we limited the number of possible pages already to
 321          * the number of pages in the large page.
 322          */
 323         if (address == (nextpage_addr - psize) && cpa->numpages == numpages) {
 324                 /*
 325                  * The address is aligned and the number of pages
 326                  * covers the full page.
 327                  */
 328                 new_pte = pfn_pte(pte_pfn(old_pte), canon_pgprot(new_prot));
 329                 __set_pmd_pte(kpte, address, new_pte);
 330                 cpa->flushtlb = 1;
 331                 do_split = 0;
 332         }
 333
 334 out_unlock:
 335         spin_unlock_irqrestore(&pgd_lock, flags);
 336
 337         return do_split;
 338 }
 339
 340 static LIST_HEAD(page_pool);
 341 static unsigned long pool_size, pool_pages, pool_low;
 342 static unsigned long pool_used, pool_failed, pool_refill;
 343
 344 static void cpa_fill_pool(void)
 345 {
 346         struct page *p;
 347         gfp_t gfp = GFP_KERNEL;
 348
 349         /* Do not allocate from interrupt context */
 350         if (in_irq() || irqs_disabled())
 351                 return;
 352         /*
 353          * Check unlocked. I does not matter when we have one more
 354          * page in the pool. The bit lock avoids recursive pool
 355          * allocations:
 356          */
 357         if (pool_pages >= pool_size || test_and_set_bit_lock(0, &pool_refill))
 358                 return;
 359
 360 #ifdef CONFIG_DEBUG_PAGEALLOC
 361         /*
 362          * We could do:
 363          * gfp = in_atomic() ? GFP_ATOMIC : GFP_KERNEL;
 364          * but this fails on !PREEMPT kernels
 365          */
 366         gfp =  GFP_ATOMIC | __GFP_NORETRY | __GFP_NOWARN;
 367 #endif
 368
 369         while (pool_pages < pool_size) {
 370                 p = alloc_pages(gfp, 0);
 371                 if (!p) {
 372                         pool_failed++;
 373                         break;
 374                 }
 375                 spin_lock_irq(&pgd_lock);
 376                 list_add(&p->lru, &page_pool);
 377                 pool_pages++;
 378                 spin_unlock_irq(&pgd_lock);
 379         }
 380         clear_bit_unlock(0, &pool_refill);
 381 }
 382
 383 #define SHIFT_MB                (20 - PAGE_SHIFT)
 384 #define ROUND_MB_GB             ((1 << 10) - 1)
 385 #define SHIFT_MB_GB             10
 386 #define POOL_PAGES_PER_GB       16
 387
 388 void __init cpa_init(void)
 389 {
 390         struct sysinfo si;
 391         unsigned long gb;
 392
 393         si_meminfo(&si);
 394         /*
 395          * Calculate the number of pool pages:
 396          *
 397          * Convert totalram (nr of pages) to MiB and round to the next
 398          * GiB. Shift MiB to Gib and multiply the result by
 399          * POOL_PAGES_PER_GB:
 400          */
 401         gb = ((si.totalram >> SHIFT_MB) + ROUND_MB_GB) >> SHIFT_MB_GB;
 402         pool_size = POOL_PAGES_PER_GB * gb;
 403         pool_low = pool_size;
 404
 405         cpa_fill_pool();
 406         printk(KERN_DEBUG
 407                "CPA: page pool initialized %lu of %lu pages preallocated\n",
 408                pool_pages, pool_size);
 409 }
 410
 411 static int split_large_page(pte_t *kpte, unsigned long address)
 412 {
 413         unsigned long flags, pfn, pfninc = 1;
 414         gfp_t gfp_flags = GFP_KERNEL;
 415         unsigned int i, level;
 416         pte_t *pbase, *tmp;
 417         pgprot_t ref_prot;
 418         struct page *base;
 419
 420 #ifdef CONFIG_DEBUG_PAGEALLOC
 421         gfp_flags = GFP_ATOMIC | __GFP_NOWARN;
 422 #endif
 423         base = alloc_pages(gfp_flags, 0);
 424         if (!base)
 425                 return -ENOMEM;
 426
 427         spin_lock_irqsave(&pgd_lock, flags);
 428         /*
 429          * Check for races, another CPU might have split this page
 430          * up for us already:
 431          */
 432         tmp = lookup_address(address, &level);
 433         if (tmp != kpte)
 434                 goto out_unlock;
 435
 436         pbase = (pte_t *)page_address(base);
 437 #ifdef CONFIG_X86_32
 438         paravirt_alloc_pt(&init_mm, page_to_pfn(base));
 439 #endif
 440         ref_prot = pte_pgprot(pte_clrhuge(*kpte));
 441
 442 #ifdef CONFIG_X86_64
 443         if (level == PG_LEVEL_1G) {
 444                 pfninc = PMD_PAGE_SIZE >> PAGE_SHIFT;
 445                 pgprot_val(ref_prot) |= _PAGE_PSE;
 446         }
 447 #endif
 448
 449         /*
 450          * Get the target pfn from the original entry:
 451          */
 452         pfn = pte_pfn(*kpte);
 453         for (i = 0; i < PTRS_PER_PTE; i++, pfn += pfninc)
 454                 set_pte(&pbase[i], pfn_pte(pfn, ref_prot));
 455
 456         /*
 457          * Install the new, split up pagetable. Important details here:
 458          *
 459          * On Intel the NX bit of all levels must be cleared to make a
 460          * page executable. See section 4.13.2 of Intel 64 and IA-32
 461          * Architectures Software Developer's Manual).
 462          *
 463          * Mark the entry present. The current mapping might be
 464          * set to not present, which we preserved above.
 465          */
 466         ref_prot = pte_pgprot(pte_mkexec(pte_clrhuge(*kpte)));
 467         pgprot_val(ref_prot) |= _PAGE_PRESENT;
 468         __set_pmd_pte(kpte, address, mk_pte(base, ref_prot));
 469         base = NULL;
 470
 471 out_unlock:
 472         spin_unlock_irqrestore(&pgd_lock, flags);
 473
 474         if (base)
 475                 __free_pages(base, 0);
 476
 477         return 0;
 478 }
 479
 480 static int __change_page_attr(unsigned long address, struct cpa_data *cpa)
 481 {
 482         int do_split, err;
 483         unsigned int level;
 484         struct page *kpte_page;
 485         pte_t *kpte;
 486
 487 repeat:
 488         kpte = lookup_address(address, &level);
 489         if (!kpte)
 490                 return -EINVAL;
 491
 492         kpte_page = virt_to_page(kpte);
 493         BUG_ON(PageLRU(kpte_page));
 494         BUG_ON(PageCompound(kpte_page));
 495
 496         if (level == PG_LEVEL_4K) {
 497                 pte_t new_pte, old_pte = *kpte;
 498                 pgprot_t new_prot = pte_pgprot(old_pte);
 499
 500                 if(!pte_val(old_pte)) {
 501                         printk(KERN_WARNING "CPA: called for zero pte. "
 502                                "vaddr = %lx cpa->vaddr = %lx\n", address,
 503                                 cpa->vaddr);
 504                         WARN_ON(1);
 505                         return -EINVAL;
 506                 }
 507
 508                 pgprot_val(new_prot) &= ~pgprot_val(cpa->mask_clr);
 509                 pgprot_val(new_prot) |= pgprot_val(cpa->mask_set);
 510
 511                 new_prot = static_protections(new_prot, address);
 512
 513                 /*
 514                  * We need to keep the pfn from the existing PTE,
 515                  * after all we're only going to change it's attributes
 516                  * not the memory it points to
 517                  */
 518                 new_pte = pfn_pte(pte_pfn(old_pte), canon_pgprot(new_prot));
 519
 520                 /*
 521                  * Do we really change anything ?
 522                  */
 523                 if (pte_val(old_pte) != pte_val(new_pte)) {
 524                         set_pte_atomic(kpte, new_pte);
 525                         cpa->flushtlb = 1;
 526                 }
 527                 cpa->numpages = 1;
 528                 return 0;
 529         }
 530
 531         /*
 532          * Check, whether we can keep the large page intact
 533          * and just change the pte:
 534          */
 535         do_split = try_preserve_large_page(kpte, address, cpa);
 536         /*
 537          * When the range fits into the existing large page,
 538          * return. cp->numpages and cpa->tlbflush have been updated in
 539          * try_large_page:
 540          */
 541         if (do_split <= 0)
 542                 return do_split;
 543
 544         /*
 545          * We have to split the large page:
 546          */
 547         err = split_large_page(kpte, address);
 548         if (!err) {
 549                 cpa->flushtlb = 1;
 550                 goto repeat;
 551         }
 552
 553         return err;
 554 }
 555
 556 /**
 557  * change_page_attr_addr - Change page table attributes in linear mapping
 558  * @address: Virtual address in linear mapping.
 559  * @prot:    New page table attribute (PAGE_*)
 560  *
 561  * Change page attributes of a page in the direct mapping. This is a variant
 562  * of change_page_attr() that also works on memory holes that do not have
 563  * mem_map entry (pfn_valid() is false).
 564  *
 565  * See change_page_attr() documentation for more details.
 566  *
 567  * Modules and drivers should use the set_memory_* APIs instead.
 568  */
 569 static int change_page_attr_addr(struct cpa_data *cpa)
 570 {
 571         int err;
 572         unsigned long address = cpa->vaddr;
 573
 574 #ifdef CONFIG_X86_64
 575         unsigned long phys_addr = __pa(address);
 576
 577         /*
 578          * If we are inside the high mapped kernel range, then we
 579          * fixup the low mapping first. __va() returns the virtual
 580          * address in the linear mapping:
 581          */
 582         if (within(address, HIGH_MAP_START, HIGH_MAP_END))
 583                 address = (unsigned long) __va(phys_addr);
 584 #endif
 585
 586         err = __change_page_attr(address, cpa);
 587         if (err)
 588                 return err;
 589
 590 #ifdef CONFIG_X86_64
 591         /*
 592          * If the physical address is inside the kernel map, we need
 593          * to touch the high mapped kernel as well:
 594          */
 595         if (within(phys_addr, 0, KERNEL_TEXT_SIZE)) {
 596                 /*
 597                  * Calc the high mapping address. See __phys_addr()
 598                  * for the non obvious details.
 599                  *
 600                  * Note that NX and other required permissions are
 601                  * checked in static_protections().
 602                  */
 603                 address = phys_addr + HIGH_MAP_START - phys_base;
 604
 605                 /*
 606                  * Our high aliases are imprecise, because we check
 607                  * everything between 0 and KERNEL_TEXT_SIZE, so do
 608                  * not propagate lookup failures back to users:
 609                  */
 610                 __change_page_attr(address, cpa);
 611         }
 612 #endif
 613         return err;
 614 }
 615
 616 static int __change_page_attr_set_clr(struct cpa_data *cpa)
 617 {
 618         int ret, numpages = cpa->numpages;
 619
 620         while (numpages) {
 621                 /*
 622                  * Store the remaining nr of pages for the large page
 623                  * preservation check.
 624                  */
 625                 cpa->numpages = numpages;
 626                 ret = change_page_attr_addr(cpa);
 627                 if (ret)
 628                         return ret;
 629
 630                 /*
 631                  * Adjust the number of pages with the result of the
 632                  * CPA operation. Either a large page has been
 633                  * preserved or a single page update happened.
 634                  */
 635                 BUG_ON(cpa->numpages > numpages);
 636                 numpages -= cpa->numpages;
 637                 cpa->vaddr += cpa->numpages * PAGE_SIZE;
 638         }
 639         return 0;
 640 }
 641
 642 static inline int cache_attr(pgprot_t attr)
 643 {
 644         return pgprot_val(attr) &
 645                 (_PAGE_PAT | _PAGE_PAT_LARGE | _PAGE_PWT | _PAGE_PCD);
 646 }
 647
 648 static int change_page_attr_set_clr(unsigned long addr, int numpages,
 649                                     pgprot_t mask_set, pgprot_t mask_clr)
 650 {
 651         struct cpa_data cpa;
 652         int ret, cache;
 653
 654         /*
 655          * Check, if we are requested to change a not supported
 656          * feature:
 657          */
 658         mask_set = canon_pgprot(mask_set);
 659         mask_clr = canon_pgprot(mask_clr);
 660         if (!pgprot_val(mask_set) && !pgprot_val(mask_clr))
 661                 return 0;
 662
 663         cpa.vaddr = addr;
 664         cpa.numpages = numpages;
 665         cpa.mask_set = mask_set;
 666         cpa.mask_clr = mask_clr;
 667         cpa.flushtlb = 0;
 668
 669         ret = __change_page_attr_set_clr(&cpa);
 670
 671         /*
 672          * Check whether we really changed something:
 673          */
 674         if (!cpa.flushtlb)
 675                 goto out;
 676
 677         /*
 678          * No need to flush, when we did not set any of the caching
 679          * attributes:
 680          */
 681         cache = cache_attr(mask_set);
 682
 683         /*
 684          * On success we use clflush, when the CPU supports it to
 685          * avoid the wbindv. If the CPU does not support it and in the
 686          * error case we fall back to cpa_flush_all (which uses
 687          * wbindv):
 688          */
 689         if (!ret && cpu_has_clflush)
 690                 cpa_flush_range(addr, numpages, cache);
 691         else
 692                 cpa_flush_all(cache);
 693
 694 out:
 695         cpa_fill_pool();
 696         return ret;
 697 }
 698
 699 static inline int change_page_attr_set(unsigned long addr, int numpages,
 700                                        pgprot_t mask)
 701 {
 702         return change_page_attr_set_clr(addr, numpages, mask, __pgprot(0));
 703 }
 704
 705 static inline int change_page_attr_clear(unsigned long addr, int numpages,
 706                                          pgprot_t mask)
 707 {
 708         return change_page_attr_set_clr(addr, numpages, __pgprot(0), mask);
 709 }
 710
 711 int set_memory_uc(unsigned long addr, int numpages)
 712 {
 713         return change_page_attr_set(addr, numpages,
 714                                     __pgprot(_PAGE_PCD | _PAGE_PWT));
 715 }
 716 EXPORT_SYMBOL(set_memory_uc);
 717
 718 int set_memory_wb(unsigned long addr, int numpages)
 719 {
 720         return change_page_attr_clear(addr, numpages,
 721                                       __pgprot(_PAGE_PCD | _PAGE_PWT));
 722 }
 723 EXPORT_SYMBOL(set_memory_wb);
 724
 725 int set_memory_x(unsigned long addr, int numpages)
 726 {
 727         return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_NX));
 728 }
 729 EXPORT_SYMBOL(set_memory_x);
 730
 731 int set_memory_nx(unsigned long addr, int numpages)
 732 {
 733         return change_page_attr_set(addr, numpages, __pgprot(_PAGE_NX));
 734 }
 735 EXPORT_SYMBOL(set_memory_nx);
 736
 737 int set_memory_ro(unsigned long addr, int numpages)
 738 {
 739         return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_RW));
 740 }
 741
 742 int set_memory_rw(unsigned long addr, int numpages)
 743 {
 744         return change_page_attr_set(addr, numpages, __pgprot(_PAGE_RW));
 745 }
 746
 747 int set_memory_np(unsigned long addr, int numpages)
 748 {
 749         return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_PRESENT));
 750 }
 751
 752 int set_pages_uc(struct page *page, int numpages)
 753 {
 754         unsigned long addr = (unsigned long)page_address(page);
 755
 756         return set_memory_uc(addr, numpages);
 757 }
 758 EXPORT_SYMBOL(set_pages_uc);
 759
 760 int set_pages_wb(struct page *page, int numpages)
 761 {
 762         unsigned long addr = (unsigned long)page_address(page);
 763
 764         return set_memory_wb(addr, numpages);
 765 }
 766 EXPORT_SYMBOL(set_pages_wb);
 767
 768 int set_pages_x(struct page *page, int numpages)
 769 {
 770         unsigned long addr = (unsigned long)page_address(page);
 771
 772         return set_memory_x(addr, numpages);
 773 }
 774 EXPORT_SYMBOL(set_pages_x);
 775
 776 int set_pages_nx(struct page *page, int numpages)
 777 {
 778         unsigned long addr = (unsigned long)page_address(page);
 779
 780         return set_memory_nx(addr, numpages);
 781 }
 782 EXPORT_SYMBOL(set_pages_nx);
 783
 784 int set_pages_ro(struct page *page, int numpages)
 785 {
 786         unsigned long addr = (unsigned long)page_address(page);
 787
 788         return set_memory_ro(addr, numpages);
 789 }
 790
 791 int set_pages_rw(struct page *page, int numpages)
 792 {
 793         unsigned long addr = (unsigned long)page_address(page);
 794
 795         return set_memory_rw(addr, numpages);
 796 }
 797
 798 #ifdef CONFIG_DEBUG_PAGEALLOC
 799
 800 static int __set_pages_p(struct page *page, int numpages)
 801 {
 802         struct cpa_data cpa = { .vaddr = (unsigned long) page_address(page),
 803                                 .numpages = numpages,
 804                                 .mask_set = __pgprot(_PAGE_PRESENT | _PAGE_RW),
 805                                 .mask_clr = __pgprot(0)};
 806
 807         return __change_page_attr_set_clr(&cpa);
 808 }
 809
 810 static int __set_pages_np(struct page *page, int numpages)
 811 {
 812         struct cpa_data cpa = { .vaddr = (unsigned long) page_address(page),
 813                                 .numpages = numpages,
 814                                 .mask_set = __pgprot(0),
 815                                 .mask_clr = __pgprot(_PAGE_PRESENT | _PAGE_RW)};
 816
 817         return __change_page_attr_set_clr(&cpa);
 818 }
 819
 820 void kernel_map_pages(struct page *page, int numpages, int enable)
 821 {
 822         if (PageHighMem(page))
 823                 return;
 824         if (!enable) {
 825                 debug_check_no_locks_freed(page_address(page),
 826                                            numpages * PAGE_SIZE);
 827         }
 828
 829         /*
 830          * If page allocator is not up yet then do not call c_p_a():
 831          */
 832         if (!debug_pagealloc_enabled)
 833                 return;
 834
 835         /*
 836          * The return value is ignored - the calls cannot fail,
 837          * large pages are disabled at boot time:
 838          */
 839         if (enable)
 840                 __set_pages_p(page, numpages);
 841         else
 842                 __set_pages_np(page, numpages);
 843
 844         /*
 845          * We should perform an IPI and flush all tlbs,
 846          * but that can deadlock->flush only current cpu:
 847          */
 848         __flush_tlb_all();
 849
 850         /*
 851          * Try to refill the page pool here. We can do this only after
 852          * the tlb flush.
 853          */
 854         cpa_fill_pool();
 855 }
 856 #endif
 857
 858 /*
 859  * The testcases use internal knowledge of the implementation that shouldn't
 860  * be exposed to the rest of the kernel. Include these directly here.
 861  */
 862 #ifdef CONFIG_CPA_DEBUG
 863 #include "pageattr-test.c"
 864 #endif