]> bbs.cooldavid.org Git - net-next-2.6.git/blame - include/linux/rmap.h
mm: change anon_vma linking to fix multi-process server scalability issue
[net-next-2.6.git] / include / linux / rmap.h
CommitLineData
1da177e4
LT
1#ifndef _LINUX_RMAP_H
2#define _LINUX_RMAP_H
3/*
4 * Declarations for Reverse Mapping functions in mm/rmap.c
5 */
6
1da177e4
LT
7#include <linux/list.h>
8#include <linux/slab.h>
9#include <linux/mm.h>
10#include <linux/spinlock.h>
bed7161a 11#include <linux/memcontrol.h>
1da177e4
LT
12
13/*
14 * The anon_vma heads a list of private "related" vmas, to scan if
15 * an anonymous page pointing to this anon_vma needs to be unmapped:
16 * the vmas on the list will be related by forking, or by splitting.
17 *
18 * Since vmas come and go as they are split and merged (particularly
19 * in mprotect), the mapping field of an anonymous page cannot point
20 * directly to a vma: instead it points to an anon_vma, on whose list
21 * the related vmas can be easily linked or unlinked.
22 *
23 * After unlinking the last vma on the list, we must garbage collect
24 * the anon_vma object itself: we're guaranteed no page can be
25 * pointing to this anon_vma once its vma list is empty.
26 */
27struct anon_vma {
28 spinlock_t lock; /* Serialize access to vma list */
db114b83
HD
29#ifdef CONFIG_KSM
30 atomic_t ksm_refcount;
31#endif
7906d00c
AA
32 /*
33 * NOTE: the LSB of the head.next is set by
34 * mm_take_all_locks() _after_ taking the above lock. So the
35 * head must only be read/written after taking the above lock
36 * to be sure to see a valid next pointer. The LSB bit itself
37 * is serialized by a system wide lock only visible to
38 * mm_take_all_locks() (mm_all_locks_mutex).
39 */
5beb4930
RR
40 struct list_head head; /* Chain of private "related" vmas */
41};
42
43/*
44 * The copy-on-write semantics of fork mean that an anon_vma
45 * can become associated with multiple processes. Furthermore,
46 * each child process will have its own anon_vma, where new
47 * pages for that process are instantiated.
48 *
49 * This structure allows us to find the anon_vmas associated
50 * with a VMA, or the VMAs associated with an anon_vma.
51 * The "same_vma" list contains the anon_vma_chains linking
52 * all the anon_vmas associated with this VMA.
53 * The "same_anon_vma" list contains the anon_vma_chains
54 * which link all the VMAs associated with this anon_vma.
55 */
56struct anon_vma_chain {
57 struct vm_area_struct *vma;
58 struct anon_vma *anon_vma;
59 struct list_head same_vma; /* locked by mmap_sem & page_table_lock */
60 struct list_head same_anon_vma; /* locked by anon_vma->lock */
1da177e4
LT
61};
62
63#ifdef CONFIG_MMU
db114b83
HD
64#ifdef CONFIG_KSM
65static inline void ksm_refcount_init(struct anon_vma *anon_vma)
66{
67 atomic_set(&anon_vma->ksm_refcount, 0);
68}
69
70static inline int ksm_refcount(struct anon_vma *anon_vma)
71{
72 return atomic_read(&anon_vma->ksm_refcount);
73}
74#else
/*
 * !CONFIG_KSM: struct anon_vma has no ksm_refcount member, so there is
 * nothing to initialise; the argument is ignored.
 */
static inline void ksm_refcount_init(struct anon_vma *anon_vma)
{
}
78
/*
 * !CONFIG_KSM: struct anon_vma has no ksm_refcount member, so the count
 * is always reported as 0; the argument is ignored.
 */
static inline int ksm_refcount(struct anon_vma *anon_vma)
{
	return 0;
}
83#endif /* CONFIG_KSM */
1da177e4 84
3ca7b3c5
HD
85static inline struct anon_vma *page_anon_vma(struct page *page)
86{
87 if (((unsigned long)page->mapping & PAGE_MAPPING_FLAGS) !=
88 PAGE_MAPPING_ANON)
89 return NULL;
90 return page_rmapping(page);
91}
92
1da177e4
LT
93static inline void anon_vma_lock(struct vm_area_struct *vma)
94{
95 struct anon_vma *anon_vma = vma->anon_vma;
96 if (anon_vma)
97 spin_lock(&anon_vma->lock);
98}
99
100static inline void anon_vma_unlock(struct vm_area_struct *vma)
101{
102 struct anon_vma *anon_vma = vma->anon_vma;
103 if (anon_vma)
104 spin_unlock(&anon_vma->lock);
105}
106
107/*
108 * anon_vma helper functions.
109 */
110void anon_vma_init(void); /* create anon_vma_cachep */
111int anon_vma_prepare(struct vm_area_struct *);
5beb4930
RR
112void unlink_anon_vmas(struct vm_area_struct *);
113int anon_vma_clone(struct vm_area_struct *, struct vm_area_struct *);
114int anon_vma_fork(struct vm_area_struct *, struct vm_area_struct *);
1da177e4 115void __anon_vma_link(struct vm_area_struct *);
db114b83 116void anon_vma_free(struct anon_vma *);
1da177e4 117
5beb4930
RR
118static inline void anon_vma_merge(struct vm_area_struct *vma,
119 struct vm_area_struct *next)
120{
121 VM_BUG_ON(vma->anon_vma != next->anon_vma);
122 unlink_anon_vmas(next);
123}
124
1da177e4
LT
125/*
126 * rmap interfaces called when adding or removing pte of page
127 */
128void page_add_anon_rmap(struct page *, struct vm_area_struct *, unsigned long);
9617d95e 129void page_add_new_anon_rmap(struct page *, struct vm_area_struct *, unsigned long);
1da177e4 130void page_add_file_rmap(struct page *);
edc315fd 131void page_remove_rmap(struct page *);
1da177e4 132
21333b2b 133static inline void page_dup_rmap(struct page *page)
1da177e4
LT
134{
135 atomic_inc(&page->_mapcount);
136}
137
138/*
139 * Called from mm/vmscan.c to handle paging out
140 */
6fe6b7e3
WF
141int page_referenced(struct page *, int is_locked,
142 struct mem_cgroup *cnt, unsigned long *vm_flags);
5ad64688
HD
143int page_referenced_one(struct page *, struct vm_area_struct *,
144 unsigned long address, unsigned int *mapcount, unsigned long *vm_flags);
145
14fa31b8
AK
/*
 * Flags passed to try_to_unmap() and try_to_unmap_one().
 *
 * The low byte (TTU_ACTION_MASK) holds one of the action values; bits 8
 * and up are independent modifier flags that may be OR-ed onto an action.
 * Use TTU_ACTION() to extract the action from a combined value.
 */
enum ttu_flags {
	TTU_UNMAP = 0,			/* unmap mode */
	TTU_MIGRATION = 1,		/* migration mode */
	TTU_MUNLOCK = 2,		/* munlock mode */
	TTU_ACTION_MASK = 0xff,

	TTU_IGNORE_MLOCK = (1 << 8),	/* ignore mlock */
	TTU_IGNORE_ACCESS = (1 << 9),	/* don't age */
	TTU_IGNORE_HWPOISON = (1 << 10),/* corrupted page is recoverable */
};
#define TTU_ACTION(x) ((x) & TTU_ACTION_MASK)
157
158int try_to_unmap(struct page *, enum ttu_flags flags);
5ad64688
HD
159int try_to_unmap_one(struct page *, struct vm_area_struct *,
160 unsigned long address, enum ttu_flags flags);
1da177e4 161
ceffc078
CO
162/*
163 * Called from mm/filemap_xip.c to unmap empty zero page
164 */
c0718806 165pte_t *page_check_address(struct page *, struct mm_struct *,
479db0bf 166 unsigned long, spinlock_t **, int);
ceffc078 167
1da177e4
LT
168/*
169 * Used by swapoff to help locate where page is expected in vma.
170 */
171unsigned long page_address_in_vma(struct page *, struct vm_area_struct *);
172
d08b3851
PZ
173/*
174 * Cleans the PTEs of shared mappings.
175 * (and since clean PTEs should also be readonly, write protects them too)
176 *
177 * returns the number of cleaned PTEs.
178 */
179int page_mkclean(struct page *);
180
b291f000
NP
181/*
182 * called in munlock()/munmap() path to check for other vmas holding
183 * the page mlocked.
184 */
185int try_to_munlock(struct page *);
b291f000 186
10be22df
AK
187/*
188 * Called by memory-failure.c to kill processes.
189 */
190struct anon_vma *page_lock_anon_vma(struct page *page);
191void page_unlock_anon_vma(struct anon_vma *anon_vma);
6a46079c 192int page_mapped_in_vma(struct page *page, struct vm_area_struct *vma);
10be22df 193
e9995ef9
HD
194/*
195 * Called by migrate.c to remove migration ptes, but might be used more later.
196 */
197int rmap_walk(struct page *page, int (*rmap_one)(struct page *,
198 struct vm_area_struct *, unsigned long, void *), void *arg);
199
1da177e4
LT
200#else /* !CONFIG_MMU */
201
202#define anon_vma_init() do {} while (0)
203#define anon_vma_prepare(vma) (0)
204#define anon_vma_link(vma) do {} while (0)
205
01ff53f4
MF
/*
 * !CONFIG_MMU version of page_referenced().
 *
 * Stores 0 through @vm_flags and returns the result of
 * TestClearPageReferenced(@page). @is_locked and @cnt are not used.
 */
static inline int page_referenced(struct page *page, int is_locked,
				  struct mem_cgroup *cnt,
				  unsigned long *vm_flags)
{
	*vm_flags = 0;
	return TestClearPageReferenced(page);
}
213
a48d07af 214#define try_to_unmap(page, refs) SWAP_FAIL
1da177e4 215
d08b3851
PZ
/*
 * !CONFIG_MMU version of page_mkclean(): always returns 0 and ignores
 * its argument.
 */
static inline int page_mkclean(struct page *page)
{
	return 0;
}
220
221
1da177e4
LT
222#endif /* CONFIG_MMU */
223
/*
 * Return values of try_to_unmap
 *
 * Kept as preprocessor macros: the !CONFIG_MMU try_to_unmap() macro
 * expands to SWAP_FAIL.
 */
#define SWAP_SUCCESS	0
#define SWAP_AGAIN	1
#define SWAP_FAIL	2
#define SWAP_MLOCK	3
1da177e4
LT
231
232#endif /* _LINUX_RMAP_H */