mm: extended batches for generic mmu_gather
[linux-2.6/linux-acpi-2.6/ibm-acpi-2.6.git] / include / asm-generic / tlb.h
blob5a946a08ff9de7f2556e8c82c70a94ef77621c05
/* include/asm-generic/tlb.h
 *
 *	Generic TLB shootdown code
 *
 * Copyright 2001 Red Hat, Inc.
 * Based on code from mm/memory.c Copyright Linus Torvalds and others.
 *
 * Copyright 2011 Red Hat, Inc., Peter Zijlstra <pzijlstr@redhat.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
15 #ifndef _ASM_GENERIC__TLB_H
16 #define _ASM_GENERIC__TLB_H
18 #include <linux/swap.h>
19 #include <asm/pgalloc.h>
20 #include <asm/tlbflush.h>
#ifdef CONFIG_HAVE_RCU_TABLE_FREE
/*
 * Semi RCU freeing of the page directories.
 *
 * This is needed by some architectures to implement software pagetable walkers.
 *
 * gup_fast() and other software pagetable walkers do a lockless page-table
 * walk and therefore need some synchronization with the freeing of the page
 * directories. The chosen means to accomplish that is by disabling IRQs over
 * the walk.
 *
 * Architectures that use IPIs to flush TLBs will then automagically DTRT,
 * since we unlink the page, flush TLBs, free the page. Since the disabling of
 * IRQs delays the completion of the TLB flush we can never observe an already
 * freed page.
 *
 * Architectures that do not have this (PPC) need to delay the freeing by some
 * other means, this is that means.
 *
 * What we do is batch the freed directory pages (tables) and RCU free them.
 * We use the sched RCU variant, as that guarantees that IRQ/preempt disabling
 * holds off grace periods.
 *
 * However, in order to batch these pages we need to allocate storage, this
 * allocation is deep inside the MM code and can thus easily fail on memory
 * pressure. To guarantee progress we fall back to single table freeing, see
 * the implementation of tlb_remove_table_one().
 */

/*
 * The prototypes below name struct mmu_gather before this header defines it.
 * Declare the tag at file scope so it is not confined to the parameter lists.
 */
struct mmu_gather;

/*
 * Header of one batch of page-table pages queued for deferred freeing.
 * The table pointers are stored directly behind the header in tables[].
 */
struct mmu_table_batch {
	struct rcu_head		rcu;	/* presumably queues the batch for RCU freeing */
	unsigned int		nr;	/* presumably the number of tables[] slots in use */
	void			*tables[0];
};

/* Number of table pointers that fit in one page after the batch header. */
#define MAX_TABLE_BATCH		\
	((PAGE_SIZE - sizeof(struct mmu_table_batch)) / sizeof(void *))

extern void tlb_table_flush(struct mmu_gather *tlb);
extern void tlb_remove_table(struct mmu_gather *tlb, void *table);

#endif
/*
 * If we can't allocate a page to make a big batch of page pointers
 * to work on, then just handle a few from the on-stack structure.
 */
#define MMU_GATHER_BUNDLE	8
/*
 * One batch of pages gathered for freeing.
 *
 * Batches form a singly linked list through @next. @nr counts the entries
 * of pages[] currently in use and @max is the capacity of pages[].
 *
 * pages[] is deliberately a zero-length trailing array: the storage behind
 * it is supplied by whoever provides the batch (the rest of an allocated
 * page, or the array that follows the embedded batch in struct mmu_gather).
 */
struct mmu_gather_batch {
	struct mmu_gather_batch	*next;
	unsigned int		nr;
	unsigned int		max;
	struct page		*pages[0];
};

/* Number of page pointers that fit in one page after the batch header. */
#define MAX_GATHER_BATCH	\
	((PAGE_SIZE - sizeof(struct mmu_gather_batch)) / sizeof(void *))
81 /* struct mmu_gather is an opaque type used by the mm code for passing around
82 * any data needed by arch specific code for tlb_remove_page.
84 struct mmu_gather {
85 struct mm_struct *mm;
86 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
87 struct mmu_table_batch *batch;
88 #endif
89 unsigned int need_flush : 1, /* Did free PTEs */
90 fast_mode : 1; /* No batching */
92 unsigned int fullmm;
94 struct mmu_gather_batch *active;
95 struct mmu_gather_batch local;
96 struct page *__pages[MMU_GATHER_BUNDLE];
/*
 * For UP we don't need to worry about TLB flush
 * and page free order so much..
 *
 * On SMP the answer comes from the gather's fast_mode bit; the argument is
 * parenthesized so any pointer expression (e.g. &gather) expands correctly.
 */
#ifdef CONFIG_SMP
  #define tlb_fast_mode(tlb) ((tlb)->fast_mode)
#else
  #define tlb_fast_mode(tlb) 1
#endif
109 static inline int tlb_next_batch(struct mmu_gather *tlb)
111 struct mmu_gather_batch *batch;
113 batch = tlb->active;
114 if (batch->next) {
115 tlb->active = batch->next;
116 return 1;
119 batch = (void *)__get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);
120 if (!batch)
121 return 0;
123 batch->next = NULL;
124 batch->nr = 0;
125 batch->max = MAX_GATHER_BATCH;
127 tlb->active->next = batch;
128 tlb->active = batch;
130 return 1;
133 /* tlb_gather_mmu
134 * Called to initialize an (on-stack) mmu_gather structure for page-table
135 * tear-down from @mm. The @fullmm argument is used when @mm is without
136 * users and we're going to destroy the full address space (exit/execve).
138 static inline void
139 tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, bool fullmm)
141 tlb->mm = mm;
143 tlb->fullmm = fullmm;
144 tlb->need_flush = 0;
145 tlb->fast_mode = (num_possible_cpus() == 1);
146 tlb->local.next = NULL;
147 tlb->local.nr = 0;
148 tlb->local.max = ARRAY_SIZE(tlb->__pages);
149 tlb->active = &tlb->local;
151 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
152 tlb->batch = NULL;
153 #endif
156 static inline void
157 tlb_flush_mmu(struct mmu_gather *tlb)
159 struct mmu_gather_batch *batch;
161 if (!tlb->need_flush)
162 return;
163 tlb->need_flush = 0;
164 tlb_flush(tlb);
165 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
166 tlb_table_flush(tlb);
167 #endif
169 if (tlb_fast_mode(tlb))
170 return;
172 for (batch = &tlb->local; batch; batch = batch->next) {
173 free_pages_and_swap_cache(batch->pages, batch->nr);
174 batch->nr = 0;
176 tlb->active = &tlb->local;
179 /* tlb_finish_mmu
180 * Called at the end of the shootdown operation to free up any resources
181 * that were required.
183 static inline void
184 tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
186 struct mmu_gather_batch *batch, *next;
188 tlb_flush_mmu(tlb);
190 /* keep the page table cache within bounds */
191 check_pgt_cache();
193 for (batch = tlb->local.next; batch; batch = next) {
194 next = batch->next;
195 free_pages((unsigned long)batch, 0);
197 tlb->local.next = NULL;
200 /* __tlb_remove_page
201 * Must perform the equivalent to __free_pte(pte_get_and_clear(ptep)), while
202 * handling the additional races in SMP caused by other CPUs caching valid
203 * mappings in their TLBs. Returns the number of free page slots left.
204 * When out of page slots we must call tlb_flush_mmu().
206 static inline int __tlb_remove_page(struct mmu_gather *tlb, struct page *page)
208 struct mmu_gather_batch *batch;
210 tlb->need_flush = 1;
212 if (tlb_fast_mode(tlb)) {
213 free_page_and_swap_cache(page);
214 return 1; /* avoid calling tlb_flush_mmu() */
217 batch = tlb->active;
218 batch->pages[batch->nr++] = page;
219 VM_BUG_ON(batch->nr > batch->max);
220 if (batch->nr == batch->max) {
221 if (!tlb_next_batch(tlb))
222 return 0;
225 return batch->max - batch->nr;
/* tlb_remove_page
 *	Similar to __tlb_remove_page but will call tlb_flush_mmu() itself when
 *	required, i.e. when __tlb_remove_page() reports no page slots left.
 */
static inline void tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	if (!__tlb_remove_page(tlb, page))
		tlb_flush_mmu(tlb);
}
/**
 * tlb_remove_tlb_entry - remember a pte unmapping for later tlb invalidation.
 *
 * Record the fact that pte's were really unmapped in ->need_flush, so we can
 * later optimise away the tlb invalidate.   This helps when userspace is
 * unmapping already-unmapped pages, which happens quite a lot.
 *
 * The arguments are then handed unchanged to __tlb_remove_tlb_entry(),
 * which is not defined in this header.
 */
#define tlb_remove_tlb_entry(tlb, ptep, address)		\
	do {							\
		(tlb)->need_flush = 1;				\
		__tlb_remove_tlb_entry(tlb, ptep, address);	\
	} while (0)
/*
 * pte_free_tlb - mark the gather as needing a flush, then pass the
 * arguments on to __pte_free_tlb(), which is not defined in this header.
 */
#define pte_free_tlb(tlb, ptep, address)			\
	do {							\
		(tlb)->need_flush = 1;				\
		__pte_free_tlb(tlb, ptep, address);		\
	} while (0)
/*
 * pud_free_tlb - mark the gather as needing a flush, then pass the
 * arguments on to __pud_free_tlb(), which is not defined in this header.
 * Not provided when __ARCH_HAS_4LEVEL_HACK is defined.
 */
#ifndef __ARCH_HAS_4LEVEL_HACK
#define pud_free_tlb(tlb, pudp, address)			\
	do {							\
		(tlb)->need_flush = 1;				\
		__pud_free_tlb(tlb, pudp, address);		\
	} while (0)
#endif
/*
 * pmd_free_tlb - mark the gather as needing a flush, then pass the
 * arguments on to __pmd_free_tlb(), which is not defined in this header.
 */
#define pmd_free_tlb(tlb, pmdp, address)			\
	do {							\
		(tlb)->need_flush = 1;				\
		__pmd_free_tlb(tlb, pmdp, address);		\
	} while (0)
/* tlb_migrate_finish - no-op in this header; expands to an empty statement. */
#define tlb_migrate_finish(mm) do {} while (0)
273 #endif /* _ASM_GENERIC__TLB_H */