arch/x86/mm/pageattr.c

   1 /*
   2  * Copyright 2002 Andi Kleen, SuSE Labs.
   3  * Thanks to Ben LaHaise for precious feedback.
   4  */
   5 #include <linux/highmem.h>
   6 #include <linux/bootmem.h>
   7 #include <linux/module.h>
   8 #include <linux/sched.h>
   9 #include <linux/slab.h>
  10 #include <linux/mm.h>
  11
  12 #include <asm/e820.h>
  13 #include <asm/processor.h>
  14 #include <asm/tlbflush.h>
  15 #include <asm/sections.h>
  16 #include <asm/uaccess.h>
  17 #include <asm/pgalloc.h>
  18
  19 struct cpa_data {
  20         unsigned long   vaddr;
  21         pgprot_t        mask_set;
  22         pgprot_t        mask_clr;
  23         int             numpages;
  24         int             flushtlb;
  25 };
  26
  27 enum {
  28         CPA_NO_SPLIT = 0,
  29         CPA_SPLIT,
  30 };
  31
  32 static inline int
  33 within(unsigned long addr, unsigned long start, unsigned long end)
  34 {
  35         return addr >= start && addr < end;
  36 }
  37
  38 /*
  39  * Flushing functions
  40  */
  41
  42 /**
  43  * clflush_cache_range - flush a cache range with clflush
  44  * @addr:       virtual start address
  45  * @size:       number of bytes to flush
  46  *
  47  * clflush is an unordered instruction which needs fencing with mfence
  48  * to avoid ordering issues.
  49  */
  50 void clflush_cache_range(void *vaddr, unsigned int size)
  51 {
  52         void *vend = vaddr + size - 1;
  53
  54         mb();
  55
  56         for (; vaddr < vend; vaddr += boot_cpu_data.x86_clflush_size)
  57                 clflush(vaddr);
  58         /*
  59          * Flush any possible final partial cacheline:
  60          */
  61         clflush(vend);
  62
  63         mb();
  64 }
  65
  66 static void __cpa_flush_all(void *arg)
  67 {
  68         unsigned long cache = (unsigned long)arg;
  69
  70         /*
  71          * Flush all to work around Errata in early athlons regarding
  72          * large page flushing.
  73          */
  74         __flush_tlb_all();
  75
  76         if (cache && boot_cpu_data.x86_model >= 4)
  77                 wbinvd();
  78 }
  79
  80 static void cpa_flush_all(unsigned long cache)
  81 {
  82         BUG_ON(irqs_disabled());
  83
  84         on_each_cpu(__cpa_flush_all, (void *) cache, 1, 1);
  85 }
  86
  87 static void __cpa_flush_range(void *arg)
  88 {
  89         /*
  90          * We could optimize that further and do individual per page
  91          * tlb invalidates for a low number of pages. Caveat: we must
  92          * flush the high aliases on 64bit as well.
  93          */
  94         __flush_tlb_all();
  95 }
  96
  97 static void cpa_flush_range(unsigned long start, int numpages, int cache)
  98 {
  99         unsigned int i, level;
 100         unsigned long addr;
 101
 102         BUG_ON(irqs_disabled());
 103         WARN_ON(PAGE_ALIGN(start) != start);
 104
 105         on_each_cpu(__cpa_flush_range, NULL, 1, 1);
 106
 107         if (!cache)
 108                 return;
 109
 110         /*
 111          * We only need to flush on one CPU,
 112          * clflush is a MESI-coherent instruction that
 113          * will cause all other CPUs to flush the same
 114          * cachelines:
 115          */
 116         for (i = 0, addr = start; i < numpages; i++, addr += PAGE_SIZE) {
 117                 pte_t *pte = lookup_address(addr, &level);
 118
 119                 /*
 120                  * Only flush present addresses:
 121                  */
 122                 if (pte && pte_present(*pte))
 123                         clflush_cache_range((void *) addr, PAGE_SIZE);
 124         }
 125 }
 126
 127 #define HIGH_MAP_START  __START_KERNEL_map
 128 #define HIGH_MAP_END    (__START_KERNEL_map + KERNEL_TEXT_SIZE)
 129
 130
 131 /*
 132  * Converts a virtual address to a X86-64 highmap address
 133  */
 134 static unsigned long virt_to_highmap(void *address)
 135 {
 136 #ifdef CONFIG_X86_64
 137         return __pa((unsigned long)address) + HIGH_MAP_START - phys_base;
 138 #else
 139         return (unsigned long)address;
 140 #endif
 141 }
 142
 143 /*
 144  * Certain areas of memory on x86 require very specific protection flags,
 145  * for example the BIOS area or kernel text. Callers don't always get this
 146  * right (again, ioremap() on BIOS memory is not uncommon) so this function
 147  * checks and fixes these known static required protection bits.
 148  */
 149 static inline pgprot_t static_protections(pgprot_t prot, unsigned long address)
 150 {
 151         pgprot_t forbidden = __pgprot(0);
 152
 153         /*
 154          * The BIOS area between 640k and 1Mb needs to be executable for
 155          * PCI BIOS based config access (CONFIG_PCI_GOBIOS) support.
 156          */
 157         if (within(__pa(address), BIOS_BEGIN, BIOS_END))
 158                 pgprot_val(forbidden) |= _PAGE_NX;
 159
 160         /*
 161          * The kernel text needs to be executable for obvious reasons
 162          * Does not cover __inittext since that is gone later on
 163          */
 164         if (within(address, (unsigned long)_text, (unsigned long)_etext))
 165                 pgprot_val(forbidden) |= _PAGE_NX;
 166         /*
 167          * Do the same for the x86-64 high kernel mapping
 168          */
 169         if (within(address, virt_to_highmap(_text), virt_to_highmap(_etext)))
 170                 pgprot_val(forbidden) |= _PAGE_NX;
 171
 172
 173 #ifdef CONFIG_DEBUG_RODATA
 174         /* The .rodata section needs to be read-only */
 175         if (within(address, (unsigned long)__start_rodata,
 176                                 (unsigned long)__end_rodata))
 177                 pgprot_val(forbidden) |= _PAGE_RW;
 178         /*
 179          * Do the same for the x86-64 high kernel mapping
 180          */
 181         if (within(address, virt_to_highmap(__start_rodata),
 182                                 virt_to_highmap(__end_rodata)))
 183                 pgprot_val(forbidden) |= _PAGE_RW;
 184 #endif
 185
 186         prot = __pgprot(pgprot_val(prot) & ~pgprot_val(forbidden));
 187
 188         return prot;
 189 }
 190
 191 /*
 192  * Lookup the page table entry for a virtual address. Return a pointer
 193  * to the entry and the level of the mapping.
 194  *
 195  * Note: We return pud and pmd either when the entry is marked large
 196  * or when the present bit is not set. Otherwise we would return a
 197  * pointer to a nonexisting mapping.
 198  */
 199 pte_t *lookup_address(unsigned long address, int *level)
 200 {
 201         pgd_t *pgd = pgd_offset_k(address);
 202         pud_t *pud;
 203         pmd_t *pmd;
 204
 205         *level = PG_LEVEL_NONE;
 206
 207         if (pgd_none(*pgd))
 208                 return NULL;
 209         pud = pud_offset(pgd, address);
 210         if (pud_none(*pud))
 211                 return NULL;
 212         pmd = pmd_offset(pud, address);
 213         if (pmd_none(*pmd))
 214                 return NULL;
 215
 216         *level = PG_LEVEL_2M;
 217         if (pmd_large(*pmd) || !pmd_present(*pmd))
 218                 return (pte_t *)pmd;
 219
 220         *level = PG_LEVEL_4K;
 221         return pte_offset_kernel(pmd, address);
 222 }
 223
 224 static void __set_pmd_pte(pte_t *kpte, unsigned long address, pte_t pte)
 225 {
 226         /* change init_mm */
 227         set_pte_atomic(kpte, pte);
 228 #ifdef CONFIG_X86_32
 229         if (!SHARED_KERNEL_PMD) {
 230                 struct page *page;
 231
 232                 list_for_each_entry(page, &pgd_list, lru) {
 233                         pgd_t *pgd;
 234                         pud_t *pud;
 235                         pmd_t *pmd;
 236
 237                         pgd = (pgd_t *)page_address(page) + pgd_index(address);
 238                         pud = pud_offset(pgd, address);
 239                         pmd = pmd_offset(pud, address);
 240                         set_pte_atomic((pte_t *)pmd, pte);
 241                 }
 242         }
 243 #endif
 244 }
 245
 246 static int try_preserve_large_page(pte_t *kpte, unsigned long address,
 247                                    struct cpa_data *cpa)
 248 {
 249         unsigned long nextpage_addr, numpages, pmask, psize, flags;
 250         pte_t new_pte, old_pte, *tmp;
 251         pgprot_t old_prot, new_prot;
 252         int level, res = CPA_SPLIT;
 253
 254         /*
 255          * An Athlon 64 X2 showed hard hangs if we tried to preserve
 256          * largepages and changed the PSE entry from RW to RO.
 257          *
 258          * As AMD CPUs have a long series of erratas in this area,
 259          * (and none of the known ones seem to explain this hang),
 260          * disable this code until the hang can be debugged:
 261          */
 262         if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD)
 263                 return res;
 264
 265         spin_lock_irqsave(&pgd_lock, flags);
 266         /*
 267          * Check for races, another CPU might have split this page
 268          * up already:
 269          */
 270         tmp = lookup_address(address, &level);
 271         if (tmp != kpte)
 272                 goto out_unlock;
 273
 274         switch (level) {
 275         case PG_LEVEL_2M:
 276                 psize = PMD_PAGE_SIZE;
 277                 pmask = PMD_PAGE_MASK;
 278                 break;
 279         case PG_LEVEL_1G:
 280         default:
 281                 res = -EINVAL;
 282                 goto out_unlock;
 283         }
 284
 285         /*
 286          * Calculate the number of pages, which fit into this large
 287          * page starting at address:
 288          */
 289         nextpage_addr = (address + psize) & pmask;
 290         numpages = (nextpage_addr - address) >> PAGE_SHIFT;
 291         if (numpages < cpa->numpages)
 292                 cpa->numpages = numpages;
 293
 294         /*
 295          * We are safe now. Check whether the new pgprot is the same:
 296          */
 297         old_pte = *kpte;
 298         old_prot = new_prot = pte_pgprot(old_pte);
 299
 300         pgprot_val(new_prot) &= ~pgprot_val(cpa->mask_clr);
 301         pgprot_val(new_prot) |= pgprot_val(cpa->mask_set);
 302         new_prot = static_protections(new_prot, address);
 303
 304         /*
 305          * If there are no changes, return. maxpages has been updated
 306          * above:
 307          */
 308         if (pgprot_val(new_prot) == pgprot_val(old_prot)) {
 309                 res = CPA_NO_SPLIT;
 310                 goto out_unlock;
 311         }
 312
 313         /*
 314          * We need to change the attributes. Check, whether we can
 315          * change the large page in one go. We request a split, when
 316          * the address is not aligned and the number of pages is
 317          * smaller than the number of pages in the large page. Note
 318          * that we limited the number of possible pages already to
 319          * the number of pages in the large page.
 320          */
 321         if (address == (nextpage_addr - psize) && cpa->numpages == numpages) {
 322                 /*
 323                  * The address is aligned and the number of pages
 324                  * covers the full page.
 325                  */
 326                 new_pte = pfn_pte(pte_pfn(old_pte), canon_pgprot(new_prot));
 327                 __set_pmd_pte(kpte, address, new_pte);
 328                 cpa->flushtlb = 1;
 329                 res = CPA_NO_SPLIT;
 330         }
 331
 332 out_unlock:
 333         spin_unlock_irqrestore(&pgd_lock, flags);
 334         return res;
 335 }
 336
 337 static int split_large_page(pte_t *kpte, unsigned long address)
 338 {
 339         pgprot_t ref_prot;
 340         gfp_t gfp_flags = GFP_KERNEL;
 341         unsigned long flags, addr, pfn;
 342         pte_t *pbase, *tmp;
 343         struct page *base;
 344         unsigned int i, level;
 345
 346 #ifdef CONFIG_DEBUG_PAGEALLOC
 347         gfp_flags = GFP_ATOMIC | __GFP_NOWARN;
 348 #endif
 349         base = alloc_pages(gfp_flags, 0);
 350         if (!base)
 351                 return -ENOMEM;
 352
 353         spin_lock_irqsave(&pgd_lock, flags);
 354         /*
 355          * Check for races, another CPU might have split this page
 356          * up for us already:
 357          */
 358         tmp = lookup_address(address, &level);
 359         if (tmp != kpte) {
 360                 WARN_ON_ONCE(1);
 361                 goto out_unlock;
 362         }
 363
 364         address = __pa(address);
 365         addr = address & PMD_PAGE_MASK;
 366         pbase = (pte_t *)page_address(base);
 367 #ifdef CONFIG_X86_32
 368         paravirt_alloc_pt(&init_mm, page_to_pfn(base));
 369 #endif
 370         ref_prot = pte_pgprot(pte_clrhuge(*kpte));
 371
 372         /*
 373          * Get the target pfn from the original entry:
 374          */
 375         pfn = pte_pfn(*kpte);
 376         for (i = 0; i < PTRS_PER_PTE; i++, pfn++)
 377                 set_pte(&pbase[i], pfn_pte(pfn, ref_prot));
 378
 379         /*
 380          * Install the new, split up pagetable. Important details here:
 381          *
 382          * On Intel the NX bit of all levels must be cleared to make a
 383          * page executable. See section 4.13.2 of Intel 64 and IA-32
 384          * Architectures Software Developer's Manual).
 385          *
 386          * Mark the entry present. The current mapping might be
 387          * set to not present, which we preserved above.
 388          */
 389         ref_prot = pte_pgprot(pte_mkexec(pte_clrhuge(*kpte)));
 390         pgprot_val(ref_prot) |= _PAGE_PRESENT;
 391         __set_pmd_pte(kpte, address, mk_pte(base, ref_prot));
 392         base = NULL;
 393
 394 out_unlock:
 395         spin_unlock_irqrestore(&pgd_lock, flags);
 396
 397         if (base)
 398                 __free_pages(base, 0);
 399
 400         return 0;
 401 }
 402
 403 static int __change_page_attr(unsigned long address, struct cpa_data *cpa)
 404 {
 405         struct page *kpte_page;
 406         int level, res;
 407         pte_t *kpte;
 408
 409 repeat:
 410         kpte = lookup_address(address, &level);
 411         if (!kpte)
 412                 return -EINVAL;
 413
 414         kpte_page = virt_to_page(kpte);
 415         BUG_ON(PageLRU(kpte_page));
 416         BUG_ON(PageCompound(kpte_page));
 417
 418         if (level == PG_LEVEL_4K) {
 419                 pte_t new_pte, old_pte = *kpte;
 420                 pgprot_t new_prot = pte_pgprot(old_pte);
 421
 422                 if(!pte_val(old_pte)) {
 423                         printk(KERN_WARNING "CPA: called for zero pte. "
 424                                "vaddr = %lx cpa->vaddr = %lx\n", address,
 425                                 cpa->vaddr);
 426                         WARN_ON(1);
 427                         return -EINVAL;
 428                 }
 429
 430                 pgprot_val(new_prot) &= ~pgprot_val(cpa->mask_clr);
 431                 pgprot_val(new_prot) |= pgprot_val(cpa->mask_set);
 432
 433                 new_prot = static_protections(new_prot, address);
 434
 435                 /*
 436                  * We need to keep the pfn from the existing PTE,
 437                  * after all we're only going to change it's attributes
 438                  * not the memory it points to
 439                  */
 440                 new_pte = pfn_pte(pte_pfn(old_pte), canon_pgprot(new_prot));
 441
 442                 /*
 443                  * Do we really change anything ?
 444                  */
 445                 if (pte_val(old_pte) != pte_val(new_pte)) {
 446                         set_pte_atomic(kpte, new_pte);
 447                         cpa->flushtlb = 1;
 448                 }
 449                 cpa->numpages = 1;
 450                 return 0;
 451         }
 452
 453         /*
 454          * Check, whether we can keep the large page intact
 455          * and just change the pte:
 456          */
 457         res = try_preserve_large_page(kpte, address, cpa);
 458         if (res < 0)
 459                 return res;
 460
 461         /*
 462          * When the range fits into the existing large page,
 463          * return. cp->numpages and cpa->tlbflush have been updated in
 464          * try_large_page:
 465          */
 466         if (res == CPA_NO_SPLIT)
 467                 return 0;
 468
 469         /*
 470          * We have to split the large page:
 471          */
 472         res = split_large_page(kpte, address);
 473         if (res)
 474                 return res;
 475         cpa->flushtlb = 1;
 476         goto repeat;
 477 }
 478
 479 /**
 480  * change_page_attr_addr - Change page table attributes in linear mapping
 481  * @address: Virtual address in linear mapping.
 482  * @prot:    New page table attribute (PAGE_*)
 483  *
 484  * Change page attributes of a page in the direct mapping. This is a variant
 485  * of change_page_attr() that also works on memory holes that do not have
 486  * mem_map entry (pfn_valid() is false).
 487  *
 488  * See change_page_attr() documentation for more details.
 489  *
 490  * Modules and drivers should use the set_memory_* APIs instead.
 491  */
 492
 493 static int change_page_attr_addr(struct cpa_data *cpa)
 494 {
 495         int err;
 496         unsigned long address = cpa->vaddr;
 497
 498 #ifdef CONFIG_X86_64
 499         unsigned long phys_addr = __pa(address);
 500
 501         /*
 502          * If we are inside the high mapped kernel range, then we
 503          * fixup the low mapping first. __va() returns the virtual
 504          * address in the linear mapping:
 505          */
 506         if (within(address, HIGH_MAP_START, HIGH_MAP_END))
 507                 address = (unsigned long) __va(phys_addr);
 508 #endif
 509
 510         err = __change_page_attr(address, cpa);
 511         if (err)
 512                 return err;
 513
 514 #ifdef CONFIG_X86_64
 515         /*
 516          * If the physical address is inside the kernel map, we need
 517          * to touch the high mapped kernel as well:
 518          */
 519         if (within(phys_addr, 0, KERNEL_TEXT_SIZE)) {
 520                 /*
 521                  * Calc the high mapping address. See __phys_addr()
 522                  * for the non obvious details.
 523                  *
 524                  * Note that NX and other required permissions are
 525                  * checked in static_protections().
 526                  */
 527                 address = phys_addr + HIGH_MAP_START - phys_base;
 528
 529                 /*
 530                  * Our high aliases are imprecise, because we check
 531                  * everything between 0 and KERNEL_TEXT_SIZE, so do
 532                  * not propagate lookup failures back to users:
 533                  */
 534                 __change_page_attr(address, cpa);
 535         }
 536 #endif
 537         return err;
 538 }
 539
 540 static int __change_page_attr_set_clr(struct cpa_data *cpa)
 541 {
 542         int ret, numpages = cpa->numpages;
 543
 544         while (numpages) {
 545                 /*
 546                  * Store the remaining nr of pages for the large page
 547                  * preservation check.
 548                  */
 549                 cpa->numpages = numpages;
 550                 ret = change_page_attr_addr(cpa);
 551                 if (ret)
 552                         return ret;
 553
 554                 /*
 555                  * Adjust the number of pages with the result of the
 556                  * CPA operation. Either a large page has been
 557                  * preserved or a single page update happened.
 558                  */
 559                 BUG_ON(cpa->numpages > numpages);
 560                 numpages -= cpa->numpages;
 561                 cpa->vaddr += cpa->numpages * PAGE_SIZE;
 562         }
 563         return 0;
 564 }
 565
 566 static inline int cache_attr(pgprot_t attr)
 567 {
 568         return pgprot_val(attr) &
 569                 (_PAGE_PAT | _PAGE_PAT_LARGE | _PAGE_PWT | _PAGE_PCD);
 570 }
 571
 572 static int change_page_attr_set_clr(unsigned long addr, int numpages,
 573                                     pgprot_t mask_set, pgprot_t mask_clr)
 574 {
 575         struct cpa_data cpa;
 576         int ret, cache;
 577
 578         /*
 579          * Check, if we are requested to change a not supported
 580          * feature:
 581          */
 582         mask_set = canon_pgprot(mask_set);
 583         mask_clr = canon_pgprot(mask_clr);
 584         if (!pgprot_val(mask_set) && !pgprot_val(mask_clr))
 585                 return 0;
 586
 587         cpa.vaddr = addr;
 588         cpa.numpages = numpages;
 589         cpa.mask_set = mask_set;
 590         cpa.mask_clr = mask_clr;
 591         cpa.flushtlb = 0;
 592
 593         ret = __change_page_attr_set_clr(&cpa);
 594
 595         /*
 596          * Check whether we really changed something:
 597          */
 598         if (!cpa.flushtlb)
 599                 return ret;
 600
 601         /*
 602          * No need to flush, when we did not set any of the caching
 603          * attributes:
 604          */
 605         cache = cache_attr(mask_set);
 606
 607         /*
 608          * On success we use clflush, when the CPU supports it to
 609          * avoid the wbindv. If the CPU does not support it and in the
 610          * error case we fall back to cpa_flush_all (which uses
 611          * wbindv):
 612          */
 613         if (!ret && cpu_has_clflush)
 614                 cpa_flush_range(addr, numpages, cache);
 615         else
 616                 cpa_flush_all(cache);
 617
 618         return ret;
 619 }
 620
 621 static inline int change_page_attr_set(unsigned long addr, int numpages,
 622                                        pgprot_t mask)
 623 {
 624         return change_page_attr_set_clr(addr, numpages, mask, __pgprot(0));
 625 }
 626
 627 static inline int change_page_attr_clear(unsigned long addr, int numpages,
 628                                          pgprot_t mask)
 629 {
 630         return change_page_attr_set_clr(addr, numpages, __pgprot(0), mask);
 631 }
 632
 633 int set_memory_uc(unsigned long addr, int numpages)
 634 {
 635         return change_page_attr_set(addr, numpages,
 636                                     __pgprot(_PAGE_PCD | _PAGE_PWT));
 637 }
 638 EXPORT_SYMBOL(set_memory_uc);
 639
 640 int set_memory_wb(unsigned long addr, int numpages)
 641 {
 642         return change_page_attr_clear(addr, numpages,
 643                                       __pgprot(_PAGE_PCD | _PAGE_PWT));
 644 }
 645 EXPORT_SYMBOL(set_memory_wb);
 646
 647 int set_memory_x(unsigned long addr, int numpages)
 648 {
 649         return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_NX));
 650 }
 651 EXPORT_SYMBOL(set_memory_x);
 652
 653 int set_memory_nx(unsigned long addr, int numpages)
 654 {
 655         return change_page_attr_set(addr, numpages, __pgprot(_PAGE_NX));
 656 }
 657 EXPORT_SYMBOL(set_memory_nx);
 658
 659 int set_memory_ro(unsigned long addr, int numpages)
 660 {
 661         return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_RW));
 662 }
 663
 664 int set_memory_rw(unsigned long addr, int numpages)
 665 {
 666         return change_page_attr_set(addr, numpages, __pgprot(_PAGE_RW));
 667 }
 668
 669 int set_memory_np(unsigned long addr, int numpages)
 670 {
 671         return change_page_attr_clear(addr, numpages, __pgprot(_PAGE_PRESENT));
 672 }
 673
 674 int set_pages_uc(struct page *page, int numpages)
 675 {
 676         unsigned long addr = (unsigned long)page_address(page);
 677
 678         return set_memory_uc(addr, numpages);
 679 }
 680 EXPORT_SYMBOL(set_pages_uc);
 681
 682 int set_pages_wb(struct page *page, int numpages)
 683 {
 684         unsigned long addr = (unsigned long)page_address(page);
 685
 686         return set_memory_wb(addr, numpages);
 687 }
 688 EXPORT_SYMBOL(set_pages_wb);
 689
 690 int set_pages_x(struct page *page, int numpages)
 691 {
 692         unsigned long addr = (unsigned long)page_address(page);
 693
 694         return set_memory_x(addr, numpages);
 695 }
 696 EXPORT_SYMBOL(set_pages_x);
 697
 698 int set_pages_nx(struct page *page, int numpages)
 699 {
 700         unsigned long addr = (unsigned long)page_address(page);
 701
 702         return set_memory_nx(addr, numpages);
 703 }
 704 EXPORT_SYMBOL(set_pages_nx);
 705
 706 int set_pages_ro(struct page *page, int numpages)
 707 {
 708         unsigned long addr = (unsigned long)page_address(page);
 709
 710         return set_memory_ro(addr, numpages);
 711 }
 712
 713 int set_pages_rw(struct page *page, int numpages)
 714 {
 715         unsigned long addr = (unsigned long)page_address(page);
 716
 717         return set_memory_rw(addr, numpages);
 718 }
 719
 720 #ifdef CONFIG_DEBUG_PAGEALLOC
 721
 722 static int __set_pages_p(struct page *page, int numpages)
 723 {
 724         struct cpa_data cpa = { .vaddr = (unsigned long) page_address(page),
 725                                 .numpages = numpages,
 726                                 .mask_set = __pgprot(_PAGE_PRESENT | _PAGE_RW),
 727                                 .mask_clr = __pgprot(0)};
 728
 729         return __change_page_attr_set_clr(&cpa);
 730 }
 731
 732 static int __set_pages_np(struct page *page, int numpages)
 733 {
 734         struct cpa_data cpa = { .vaddr = (unsigned long) page_address(page),
 735                                 .numpages = numpages,
 736                                 .mask_set = __pgprot(0),
 737                                 .mask_clr = __pgprot(_PAGE_PRESENT | _PAGE_RW)};
 738
 739         return __change_page_attr_set_clr(&cpa);
 740 }
 741
 742 void kernel_map_pages(struct page *page, int numpages, int enable)
 743 {
 744         if (PageHighMem(page))
 745                 return;
 746         if (!enable) {
 747                 debug_check_no_locks_freed(page_address(page),
 748                                            numpages * PAGE_SIZE);
 749         }
 750
 751         /*
 752          * If page allocator is not up yet then do not call c_p_a():
 753          */
 754         if (!debug_pagealloc_enabled)
 755                 return;
 756
 757         /*
 758          * The return value is ignored - the calls cannot fail,
 759          * large pages are disabled at boot time:
 760          */
 761         if (enable)
 762                 __set_pages_p(page, numpages);
 763         else
 764                 __set_pages_np(page, numpages);
 765
 766         /*
 767          * We should perform an IPI and flush all tlbs,
 768          * but that can deadlock->flush only current cpu:
 769          */
 770         __flush_tlb_all();
 771 }
 772 #endif
 773
 774 /*
 775  * The testcases use internal knowledge of the implementation that shouldn't
 776  * be exposed to the rest of the kernel. Include these directly here.
 777  */
 778 #ifdef CONFIG_CPA_DEBUG
 779 #include "pageattr-test.c"
 780 #endif