0001
0002
0003
0004
0005
0006
0007
0008
0009
0010
0011
0012
0013
0014
0015
0016
0017
0018
0019
0020 #include <linux/mm.h>
0021 #include <linux/export.h>
0022 #include <linux/swap.h>
0023 #include <linux/bio.h>
0024 #include <linux/pagemap.h>
0025 #include <linux/mempool.h>
0026 #include <linux/init.h>
0027 #include <linux/hash.h>
0028 #include <linux/highmem.h>
0029 #include <linux/kgdb.h>
0030 #include <asm/tlbflush.h>
0031 #include <linux/vmalloc.h>
0032
0033
0034
0035
0036
0037
0038
0039
0040
0041 #ifdef CONFIG_HIGHMEM
0042
0043
0044
0045
0046
0047
0048 #ifndef get_pkmap_color
0049
0050
0051
0052
/*
 * Default colour hook for the pkmap area.
 *
 * This fallback is only compiled when get_pkmap_color has not been defined
 * already. It assigns every page the same colour, 0, and never looks at
 * @page.
 */
static inline unsigned int get_pkmap_color(struct page *page)
{
	const unsigned int only_color = 0;

	return only_color;
}
#define get_pkmap_color get_pkmap_color
0058
0059
0060
0061
0062 static inline unsigned int get_next_pkmap_nr(unsigned int color)
0063 {
0064 static unsigned int last_pkmap_nr;
0065
0066 last_pkmap_nr = (last_pkmap_nr + 1) & LAST_PKMAP_MASK;
0067 return last_pkmap_nr;
0068 }
0069
0070
0071
0072
0073
0074
/*
 * Report whether the slot cursor has wrapped back to index 0.
 *
 * Returns 1 when @pkmap_nr is 0 and 0 otherwise; @color is ignored by this
 * default implementation. map_new_virtual() uses a true result as the cue to
 * flush stale mappings and restart its scan budget.
 */
static inline int no_more_pkmaps(unsigned int pkmap_nr, unsigned int color)
{
	return !pkmap_nr;
}
0079
0080
0081
0082
0083
0084
0085 static inline int get_pkmap_entries_count(unsigned int color)
0086 {
0087 return LAST_PKMAP;
0088 }
0089
0090
0091
0092
0093
0094
0095 static inline wait_queue_head_t *get_pkmap_wait_queue_head(unsigned int color)
0096 {
0097 static DECLARE_WAIT_QUEUE_HEAD(pkmap_map_wait);
0098
0099 return &pkmap_map_wait;
0100 }
0101 #endif
0102
0103 atomic_long_t _totalhigh_pages __read_mostly;
0104 EXPORT_SYMBOL(_totalhigh_pages);
0105
0106 unsigned int __nr_free_highpages(void)
0107 {
0108 struct zone *zone;
0109 unsigned int pages = 0;
0110
0111 for_each_populated_zone(zone) {
0112 if (is_highmem(zone))
0113 pages += zone_page_state(zone, NR_FREE_PAGES);
0114 }
0115
0116 return pages;
0117 }
0118
0119 static int pkmap_count[LAST_PKMAP];
0120 static __cacheline_aligned_in_smp DEFINE_SPINLOCK(kmap_lock);
0121
0122 pte_t *pkmap_page_table;
0123
0124
0125
0126
0127
0128
/*
 * Locking helpers for kmap_lock.
 *
 * With ARCH_NEEDS_KMAP_HIGH_GET the lock is taken with interrupts disabled
 * (the _irq variants for lock_kmap(), the _irqsave variants for
 * lock_kmap_any()). Otherwise a plain spin_lock() is used and @flags is only
 * evaluated and discarded.
 * NOTE(review): the irq-safe variants presumably exist because
 * kmap_high_get() can run in contexts where interrupts matter - confirm.
 */
#ifdef ARCH_NEEDS_KMAP_HIGH_GET
#define lock_kmap()		spin_lock_irq(&kmap_lock)
#define unlock_kmap()		spin_unlock_irq(&kmap_lock)
#define lock_kmap_any(flags)	spin_lock_irqsave(&kmap_lock, flags)
#define unlock_kmap_any(flags)	spin_unlock_irqrestore(&kmap_lock, flags)
#else
#define lock_kmap()		spin_lock(&kmap_lock)
#define unlock_kmap()		spin_unlock(&kmap_lock)
#define lock_kmap_any(flags)	do { spin_lock(&kmap_lock); (void)(flags); } while (0)
#define unlock_kmap_any(flags)	do { spin_unlock(&kmap_lock); (void)(flags); } while (0)
#endif
0142
0143 struct page *__kmap_to_page(void *vaddr)
0144 {
0145 unsigned long addr = (unsigned long)vaddr;
0146
0147 if (addr >= PKMAP_ADDR(0) && addr < PKMAP_ADDR(LAST_PKMAP)) {
0148 int i = PKMAP_NR(addr);
0149
0150 return pte_page(pkmap_page_table[i]);
0151 }
0152
0153 return virt_to_page(vaddr);
0154 }
0155 EXPORT_SYMBOL(__kmap_to_page);
0156
0157 static void flush_all_zero_pkmaps(void)
0158 {
0159 int i;
0160 int need_flush = 0;
0161
0162 flush_cache_kmaps();
0163
0164 for (i = 0; i < LAST_PKMAP; i++) {
0165 struct page *page;
0166
0167
0168
0169
0170
0171
0172
0173 if (pkmap_count[i] != 1)
0174 continue;
0175 pkmap_count[i] = 0;
0176
0177
0178 BUG_ON(pte_none(pkmap_page_table[i]));
0179
0180
0181
0182
0183
0184
0185
0186
0187 page = pte_page(pkmap_page_table[i]);
0188 pte_clear(&init_mm, PKMAP_ADDR(i), &pkmap_page_table[i]);
0189
0190 set_page_address(page, NULL);
0191 need_flush = 1;
0192 }
0193 if (need_flush)
0194 flush_tlb_kernel_range(PKMAP_ADDR(0), PKMAP_ADDR(LAST_PKMAP));
0195 }
0196
/*
 * Take kmap_lock and unmap all pkmap slots that are mapped but unused
 * (see flush_all_zero_pkmaps()).
 */
void __kmap_flush_unused(void)
{
	lock_kmap();
	flush_all_zero_pkmaps();
	unlock_kmap();
}
0203
0204 static inline unsigned long map_new_virtual(struct page *page)
0205 {
0206 unsigned long vaddr;
0207 int count;
0208 unsigned int last_pkmap_nr;
0209 unsigned int color = get_pkmap_color(page);
0210
0211 start:
0212 count = get_pkmap_entries_count(color);
0213
0214 for (;;) {
0215 last_pkmap_nr = get_next_pkmap_nr(color);
0216 if (no_more_pkmaps(last_pkmap_nr, color)) {
0217 flush_all_zero_pkmaps();
0218 count = get_pkmap_entries_count(color);
0219 }
0220 if (!pkmap_count[last_pkmap_nr])
0221 break;
0222 if (--count)
0223 continue;
0224
0225
0226
0227
0228 {
0229 DECLARE_WAITQUEUE(wait, current);
0230 wait_queue_head_t *pkmap_map_wait =
0231 get_pkmap_wait_queue_head(color);
0232
0233 __set_current_state(TASK_UNINTERRUPTIBLE);
0234 add_wait_queue(pkmap_map_wait, &wait);
0235 unlock_kmap();
0236 schedule();
0237 remove_wait_queue(pkmap_map_wait, &wait);
0238 lock_kmap();
0239
0240
0241 if (page_address(page))
0242 return (unsigned long)page_address(page);
0243
0244
0245 goto start;
0246 }
0247 }
0248 vaddr = PKMAP_ADDR(last_pkmap_nr);
0249 set_pte_at(&init_mm, vaddr,
0250 &(pkmap_page_table[last_pkmap_nr]), mk_pte(page, kmap_prot));
0251
0252 pkmap_count[last_pkmap_nr] = 1;
0253 set_page_address(page, (void *)vaddr);
0254
0255 return vaddr;
0256 }
0257
0258
0259
0260
0261
0262
0263
0264
0265
0266 void *kmap_high(struct page *page)
0267 {
0268 unsigned long vaddr;
0269
0270
0271
0272
0273
0274 lock_kmap();
0275 vaddr = (unsigned long)page_address(page);
0276 if (!vaddr)
0277 vaddr = map_new_virtual(page);
0278 pkmap_count[PKMAP_NR(vaddr)]++;
0279 BUG_ON(pkmap_count[PKMAP_NR(vaddr)] < 2);
0280 unlock_kmap();
0281 return (void *) vaddr;
0282 }
0283 EXPORT_SYMBOL(kmap_high);
0284
#ifdef ARCH_NEEDS_KMAP_HIGH_GET
/*
 * kmap_high_get - take a reference on @page's existing pkmap mapping
 *
 * Never creates a mapping. If page_address() reports one, the slot's use
 * count is incremented under kmap_lock (taken via lock_kmap_any()).
 *
 * Returns the mapped virtual address, or NULL when @page is not mapped.
 */
void *kmap_high_get(struct page *page)
{
	unsigned long vaddr, flags;

	lock_kmap_any(flags);

	vaddr = (unsigned long)page_address(page);
	if (vaddr != 0) {
		/* A page with a recorded address must own a live slot. */
		BUG_ON(pkmap_count[PKMAP_NR(vaddr)] < 1);
		pkmap_count[PKMAP_NR(vaddr)] += 1;
	}

	unlock_kmap_any(flags);

	return (void *) vaddr;
}
#endif
0310
0311
0312
0313
0314
0315
0316
0317
0318 void kunmap_high(struct page *page)
0319 {
0320 unsigned long vaddr;
0321 unsigned long nr;
0322 unsigned long flags;
0323 int need_wakeup;
0324 unsigned int color = get_pkmap_color(page);
0325 wait_queue_head_t *pkmap_map_wait;
0326
0327 lock_kmap_any(flags);
0328 vaddr = (unsigned long)page_address(page);
0329 BUG_ON(!vaddr);
0330 nr = PKMAP_NR(vaddr);
0331
0332
0333
0334
0335
0336 need_wakeup = 0;
0337 switch (--pkmap_count[nr]) {
0338 case 0:
0339 BUG();
0340 case 1:
0341
0342
0343
0344
0345
0346
0347
0348
0349
0350
0351 pkmap_map_wait = get_pkmap_wait_queue_head(color);
0352 need_wakeup = waitqueue_active(pkmap_map_wait);
0353 }
0354 unlock_kmap_any(flags);
0355
0356
0357 if (need_wakeup)
0358 wake_up(pkmap_map_wait);
0359 }
0360 EXPORT_SYMBOL(kunmap_high);
0361
0362 void zero_user_segments(struct page *page, unsigned start1, unsigned end1,
0363 unsigned start2, unsigned end2)
0364 {
0365 unsigned int i;
0366
0367 BUG_ON(end1 > page_size(page) || end2 > page_size(page));
0368
0369 if (start1 >= end1)
0370 start1 = end1 = 0;
0371 if (start2 >= end2)
0372 start2 = end2 = 0;
0373
0374 for (i = 0; i < compound_nr(page); i++) {
0375 void *kaddr = NULL;
0376
0377 if (start1 >= PAGE_SIZE) {
0378 start1 -= PAGE_SIZE;
0379 end1 -= PAGE_SIZE;
0380 } else {
0381 unsigned this_end = min_t(unsigned, end1, PAGE_SIZE);
0382
0383 if (end1 > start1) {
0384 kaddr = kmap_local_page(page + i);
0385 memset(kaddr + start1, 0, this_end - start1);
0386 }
0387 end1 -= this_end;
0388 start1 = 0;
0389 }
0390
0391 if (start2 >= PAGE_SIZE) {
0392 start2 -= PAGE_SIZE;
0393 end2 -= PAGE_SIZE;
0394 } else {
0395 unsigned this_end = min_t(unsigned, end2, PAGE_SIZE);
0396
0397 if (end2 > start2) {
0398 if (!kaddr)
0399 kaddr = kmap_local_page(page + i);
0400 memset(kaddr + start2, 0, this_end - start2);
0401 }
0402 end2 -= this_end;
0403 start2 = 0;
0404 }
0405
0406 if (kaddr) {
0407 kunmap_local(kaddr);
0408 flush_dcache_page(page + i);
0409 }
0410
0411 if (!end1 && !end2)
0412 break;
0413 }
0414
0415 BUG_ON((start1 | start2 | end1 | end2) != 0);
0416 }
0417 EXPORT_SYMBOL(zero_user_segments);
0418 #endif
0419
0420 #ifdef CONFIG_KMAP_LOCAL
0421
0422 #include <asm/kmap_size.h>
0423
0424
0425
0426
0427
/*
 * Step by which the per-task kmap_local index grows per mapping. With
 * CONFIG_DEBUG_KMAP_LOCAL every mapping consumes two index slots, leaving
 * the even-numbered slots unused (the sched in/out code expects them to
 * be empty); otherwise one slot is used per mapping.
 */
#ifdef CONFIG_DEBUG_KMAP_LOCAL
# define KM_INCR	2
#else
# define KM_INCR	1
#endif
0433
0434 static inline int kmap_local_idx_push(void)
0435 {
0436 WARN_ON_ONCE(in_hardirq() && !irqs_disabled());
0437 current->kmap_ctrl.idx += KM_INCR;
0438 BUG_ON(current->kmap_ctrl.idx >= KM_MAX_IDX);
0439 return current->kmap_ctrl.idx - 1;
0440 }
0441
0442 static inline int kmap_local_idx(void)
0443 {
0444 return current->kmap_ctrl.idx - 1;
0445 }
0446
0447 static inline void kmap_local_idx_pop(void)
0448 {
0449 current->kmap_ctrl.idx -= KM_INCR;
0450 BUG_ON(current->kmap_ctrl.idx < 0);
0451 }
0452
0453 #ifndef arch_kmap_local_post_map
0454 # define arch_kmap_local_post_map(vaddr, pteval) do { } while (0)
0455 #endif
0456
0457 #ifndef arch_kmap_local_pre_unmap
0458 # define arch_kmap_local_pre_unmap(vaddr) do { } while (0)
0459 #endif
0460
0461 #ifndef arch_kmap_local_post_unmap
0462 # define arch_kmap_local_post_unmap(vaddr) do { } while (0)
0463 #endif
0464
0465 #ifndef arch_kmap_local_map_idx
0466 #define arch_kmap_local_map_idx(idx, pfn) kmap_local_calc_idx(idx)
0467 #endif
0468
0469 #ifndef arch_kmap_local_unmap_idx
0470 #define arch_kmap_local_unmap_idx(idx, vaddr) kmap_local_calc_idx(idx)
0471 #endif
0472
0473 #ifndef arch_kmap_local_high_get
0474 static inline void *arch_kmap_local_high_get(struct page *page)
0475 {
0476 return NULL;
0477 }
0478 #endif
0479
0480 #ifndef arch_kmap_local_set_pte
0481 #define arch_kmap_local_set_pte(mm, vaddr, ptep, ptev) \
0482 set_pte_at(mm, vaddr, ptep, ptev)
0483 #endif
0484
0485
0486 static inline bool kmap_high_unmap_local(unsigned long vaddr)
0487 {
0488 #ifdef ARCH_NEEDS_KMAP_HIGH_GET
0489 if (vaddr >= PKMAP_ADDR(0) && vaddr < PKMAP_ADDR(LAST_PKMAP)) {
0490 kunmap_high(pte_page(pkmap_page_table[PKMAP_NR(vaddr)]));
0491 return true;
0492 }
0493 #endif
0494 return false;
0495 }
0496
0497 static inline int kmap_local_calc_idx(int idx)
0498 {
0499 return idx + KM_MAX_IDX * smp_processor_id();
0500 }
0501
0502 static pte_t *__kmap_pte;
0503
0504 static pte_t *kmap_get_pte(unsigned long vaddr, int idx)
0505 {
0506 if (IS_ENABLED(CONFIG_KMAP_LOCAL_NON_LINEAR_PTE_ARRAY))
0507
0508
0509
0510
0511 return virt_to_kpte(vaddr);
0512 if (!__kmap_pte)
0513 __kmap_pte = virt_to_kpte(__fix_to_virt(FIX_KMAP_BEGIN));
0514 return &__kmap_pte[-idx];
0515 }
0516
0517 void *__kmap_local_pfn_prot(unsigned long pfn, pgprot_t prot)
0518 {
0519 pte_t pteval, *kmap_pte;
0520 unsigned long vaddr;
0521 int idx;
0522
0523
0524
0525
0526
0527 migrate_disable();
0528 preempt_disable();
0529 idx = arch_kmap_local_map_idx(kmap_local_idx_push(), pfn);
0530 vaddr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
0531 kmap_pte = kmap_get_pte(vaddr, idx);
0532 BUG_ON(!pte_none(*kmap_pte));
0533 pteval = pfn_pte(pfn, prot);
0534 arch_kmap_local_set_pte(&init_mm, vaddr, kmap_pte, pteval);
0535 arch_kmap_local_post_map(vaddr, pteval);
0536 current->kmap_ctrl.pteval[kmap_local_idx()] = pteval;
0537 preempt_enable();
0538
0539 return (void *)vaddr;
0540 }
0541 EXPORT_SYMBOL_GPL(__kmap_local_pfn_prot);
0542
0543 void *__kmap_local_page_prot(struct page *page, pgprot_t prot)
0544 {
0545 void *kmap;
0546
0547
0548
0549
0550
0551
0552 if (!IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL_FORCE_MAP) && !PageHighMem(page))
0553 return page_address(page);
0554
0555
0556 kmap = arch_kmap_local_high_get(page);
0557 if (kmap)
0558 return kmap;
0559
0560 return __kmap_local_pfn_prot(page_to_pfn(page), prot);
0561 }
0562 EXPORT_SYMBOL(__kmap_local_page_prot);
0563
0564 void kunmap_local_indexed(const void *vaddr)
0565 {
0566 unsigned long addr = (unsigned long) vaddr & PAGE_MASK;
0567 pte_t *kmap_pte;
0568 int idx;
0569
0570 if (addr < __fix_to_virt(FIX_KMAP_END) ||
0571 addr > __fix_to_virt(FIX_KMAP_BEGIN)) {
0572 if (IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL_FORCE_MAP)) {
0573
0574 WARN_ON_ONCE(1);
0575 return;
0576 }
0577
0578
0579
0580
0581
0582
0583 if (!kmap_high_unmap_local(addr))
0584 WARN_ON_ONCE(addr < PAGE_OFFSET);
0585 return;
0586 }
0587
0588 preempt_disable();
0589 idx = arch_kmap_local_unmap_idx(kmap_local_idx(), addr);
0590 WARN_ON_ONCE(addr != __fix_to_virt(FIX_KMAP_BEGIN + idx));
0591
0592 kmap_pte = kmap_get_pte(addr, idx);
0593 arch_kmap_local_pre_unmap(addr);
0594 pte_clear(&init_mm, addr, kmap_pte);
0595 arch_kmap_local_post_unmap(addr);
0596 current->kmap_ctrl.pteval[kmap_local_idx()] = __pte(0);
0597 kmap_local_idx_pop();
0598 preempt_enable();
0599 migrate_enable();
0600 }
0601 EXPORT_SYMBOL(kunmap_local_indexed);
0602
0603
0604
0605
0606
0607
0608
0609
0610
0611
0612
0613 void __kmap_local_sched_out(void)
0614 {
0615 struct task_struct *tsk = current;
0616 pte_t *kmap_pte;
0617 int i;
0618
0619
0620 for (i = 0; i < tsk->kmap_ctrl.idx; i++) {
0621 pte_t pteval = tsk->kmap_ctrl.pteval[i];
0622 unsigned long addr;
0623 int idx;
0624
0625
0626 if (IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL) && !(i & 0x01)) {
0627 WARN_ON_ONCE(pte_val(pteval) != 0);
0628 continue;
0629 }
0630 if (WARN_ON_ONCE(pte_none(pteval)))
0631 continue;
0632
0633
0634
0635
0636
0637
0638
0639
0640 idx = arch_kmap_local_map_idx(i, pte_pfn(pteval));
0641
0642 addr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
0643 kmap_pte = kmap_get_pte(addr, idx);
0644 arch_kmap_local_pre_unmap(addr);
0645 pte_clear(&init_mm, addr, kmap_pte);
0646 arch_kmap_local_post_unmap(addr);
0647 }
0648 }
0649
0650 void __kmap_local_sched_in(void)
0651 {
0652 struct task_struct *tsk = current;
0653 pte_t *kmap_pte;
0654 int i;
0655
0656
0657 for (i = 0; i < tsk->kmap_ctrl.idx; i++) {
0658 pte_t pteval = tsk->kmap_ctrl.pteval[i];
0659 unsigned long addr;
0660 int idx;
0661
0662
0663 if (IS_ENABLED(CONFIG_DEBUG_KMAP_LOCAL) && !(i & 0x01)) {
0664 WARN_ON_ONCE(pte_val(pteval) != 0);
0665 continue;
0666 }
0667 if (WARN_ON_ONCE(pte_none(pteval)))
0668 continue;
0669
0670
0671 idx = arch_kmap_local_map_idx(i, pte_pfn(pteval));
0672 addr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
0673 kmap_pte = kmap_get_pte(addr, idx);
0674 set_pte_at(&init_mm, addr, kmap_pte, pteval);
0675 arch_kmap_local_post_map(addr, pteval);
0676 }
0677 }
0678
0679 void kmap_local_fork(struct task_struct *tsk)
0680 {
0681 if (WARN_ON_ONCE(tsk->kmap_ctrl.idx))
0682 memset(&tsk->kmap_ctrl, 0, sizeof(tsk->kmap_ctrl));
0683 }
0684
0685 #endif
0686
0687 #if defined(HASHED_PAGE_VIRTUAL)
0688
0689 #define PA_HASH_ORDER 7
0690
0691
0692
0693
0694 struct page_address_map {
0695 struct page *page;
0696 void *virtual;
0697 struct list_head list;
0698 };
0699
0700 static struct page_address_map page_address_maps[LAST_PKMAP];
0701
0702
0703
0704
0705 static struct page_address_slot {
0706 struct list_head lh;
0707 spinlock_t lock;
0708 } ____cacheline_aligned_in_smp page_address_htable[1<<PA_HASH_ORDER];
0709
0710 static struct page_address_slot *page_slot(const struct page *page)
0711 {
0712 return &page_address_htable[hash_ptr(page, PA_HASH_ORDER)];
0713 }
0714
0715
0716
0717
0718
0719
0720
0721 void *page_address(const struct page *page)
0722 {
0723 unsigned long flags;
0724 void *ret;
0725 struct page_address_slot *pas;
0726
0727 if (!PageHighMem(page))
0728 return lowmem_page_address(page);
0729
0730 pas = page_slot(page);
0731 ret = NULL;
0732 spin_lock_irqsave(&pas->lock, flags);
0733 if (!list_empty(&pas->lh)) {
0734 struct page_address_map *pam;
0735
0736 list_for_each_entry(pam, &pas->lh, list) {
0737 if (pam->page == page) {
0738 ret = pam->virtual;
0739 break;
0740 }
0741 }
0742 }
0743
0744 spin_unlock_irqrestore(&pas->lock, flags);
0745 return ret;
0746 }
0747 EXPORT_SYMBOL(page_address);
0748
0749
0750
0751
0752
0753
0754 void set_page_address(struct page *page, void *virtual)
0755 {
0756 unsigned long flags;
0757 struct page_address_slot *pas;
0758 struct page_address_map *pam;
0759
0760 BUG_ON(!PageHighMem(page));
0761
0762 pas = page_slot(page);
0763 if (virtual) {
0764 pam = &page_address_maps[PKMAP_NR((unsigned long)virtual)];
0765 pam->page = page;
0766 pam->virtual = virtual;
0767
0768 spin_lock_irqsave(&pas->lock, flags);
0769 list_add_tail(&pam->list, &pas->lh);
0770 spin_unlock_irqrestore(&pas->lock, flags);
0771 } else {
0772 spin_lock_irqsave(&pas->lock, flags);
0773 list_for_each_entry(pam, &pas->lh, list) {
0774 if (pam->page == page) {
0775 list_del(&pam->list);
0776 break;
0777 }
0778 }
0779 spin_unlock_irqrestore(&pas->lock, flags);
0780 }
0781
0782 return;
0783 }
0784
0785 void __init page_address_init(void)
0786 {
0787 int i;
0788
0789 for (i = 0; i < ARRAY_SIZE(page_address_htable); i++) {
0790 INIT_LIST_HEAD(&page_address_htable[i].lh);
0791 spin_lock_init(&page_address_htable[i].lock);
0792 }
0793 }
0794
0795 #endif