]> bbs.cooldavid.org Git - net-next-2.6.git/blame - fs/ramfs/file-nommu.c
nommu: fix race between ramfs truncation and shared mmap
[net-next-2.6.git] / fs / ramfs / file-nommu.c
CommitLineData
642fb4d1
DH
1/* file-nommu.c: no-MMU version of ramfs
2 *
3 * Copyright (C) 2005 Red Hat, Inc. All Rights Reserved.
4 * Written by David Howells (dhowells@redhat.com)
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
12#include <linux/module.h>
13#include <linux/fs.h>
131612df 14#include <linux/mm.h>
642fb4d1
DH
15#include <linux/pagemap.h>
16#include <linux/highmem.h>
17#include <linux/init.h>
18#include <linux/string.h>
642fb4d1
DH
19#include <linux/backing-dev.h>
20#include <linux/ramfs.h>
642fb4d1
DH
21#include <linux/pagevec.h>
22#include <linux/mman.h>
5c805365 23#include <linux/sched.h>
642fb4d1
DH
24
25#include <asm/uaccess.h>
26#include "internal.h"
27
28static int ramfs_nommu_setattr(struct dentry *, struct iattr *);
29
f5e54d6e 30const struct address_space_operations ramfs_aops = {
642fb4d1 31 .readpage = simple_readpage,
800d15a5
NP
32 .write_begin = simple_write_begin,
33 .write_end = simple_write_end,
46626296 34 .set_page_dirty = __set_page_dirty_no_writeback,
642fb4d1
DH
35};
36
4b6f5d20 37const struct file_operations ramfs_file_operations = {
642fb4d1
DH
38 .mmap = ramfs_nommu_mmap,
39 .get_unmapped_area = ramfs_nommu_get_unmapped_area,
543ade1f
BP
40 .read = do_sync_read,
41 .aio_read = generic_file_aio_read,
42 .write = do_sync_write,
43 .aio_write = generic_file_aio_write,
642fb4d1 44 .fsync = simple_sync_file,
5ffc4ef4 45 .splice_read = generic_file_splice_read,
8b3d3567 46 .splice_write = generic_file_splice_write,
642fb4d1
DH
47 .llseek = generic_file_llseek,
48};
49
c5ef1c42 50const struct inode_operations ramfs_file_inode_operations = {
642fb4d1
DH
51 .setattr = ramfs_nommu_setattr,
52 .getattr = simple_getattr,
53};
54
55/*****************************************************************************/
56/*
57 * add a contiguous set of pages into a ramfs inode when it's truncated from
58 * size 0 on the assumption that it's going to be used for an mmap of shared
59 * memory
60 */
4b19de6d 61int ramfs_nommu_expand_for_mapping(struct inode *inode, size_t newsize)
642fb4d1 62{
0f67b0b0 63 unsigned long npages, xpages, loop;
642fb4d1
DH
64 struct page *pages;
65 unsigned order;
66 void *data;
67 int ret;
68
69 /* make various checks */
70 order = get_order(newsize);
71 if (unlikely(order >= MAX_ORDER))
c08d3b0e 72 return -EFBIG;
642fb4d1 73
c08d3b0e 74 ret = inode_newsize_ok(inode, newsize);
75 if (ret)
76 return ret;
642fb4d1
DH
77
78 i_size_write(inode, newsize);
79
80 /* allocate enough contiguous pages to be able to satisfy the
81 * request */
82 pages = alloc_pages(mapping_gfp_mask(inode->i_mapping), order);
83 if (!pages)
84 return -ENOMEM;
85
86 /* split the high-order page into an array of single pages */
87 xpages = 1UL << order;
88 npages = (newsize + PAGE_SIZE - 1) >> PAGE_SHIFT;
89
84097518 90 split_page(pages, order);
642fb4d1
DH
91
92 /* trim off any pages we don't actually require */
93 for (loop = npages; loop < xpages; loop++)
94 __free_page(pages + loop);
95
96 /* clear the memory we allocated */
97 newsize = PAGE_SIZE * npages;
98 data = page_address(pages);
99 memset(data, 0, newsize);
100
101 /* attach all the pages to the inode's address space */
642fb4d1
DH
102 for (loop = 0; loop < npages; loop++) {
103 struct page *page = pages + loop;
104
2678958e
JW
105 ret = add_to_page_cache_lru(page, inode->i_mapping, loop,
106 GFP_KERNEL);
642fb4d1
DH
107 if (ret < 0)
108 goto add_error;
109
020fe22f
EB
110 /* prevent the page from being discarded on memory pressure */
111 SetPageDirty(page);
112
642fb4d1
DH
113 unlock_page(page);
114 }
115
642fb4d1
DH
116 return 0;
117
c08d3b0e 118add_error:
2678958e
JW
119 while (loop < npages)
120 __free_page(pages + loop++);
642fb4d1
DH
121 return ret;
122}
123
124/*****************************************************************************/
125/*
126 * check that file shrinkage doesn't leave any VMAs dangling in midair
127 */
128static int ramfs_nommu_check_mappings(struct inode *inode,
129 size_t newsize, size_t size)
130{
131 struct vm_area_struct *vma;
132 struct prio_tree_iter iter;
133
81759b5b
DH
134 down_write(&nommu_region_sem);
135
642fb4d1
DH
136 /* search for VMAs that fall within the dead zone */
137 vma_prio_tree_foreach(vma, &iter, &inode->i_mapping->i_mmap,
138 newsize >> PAGE_SHIFT,
139 (size + PAGE_SIZE - 1) >> PAGE_SHIFT
140 ) {
141 /* found one - only interested if it's shared out of the page
142 * cache */
81759b5b
DH
143 if (vma->vm_flags & VM_SHARED) {
144 up_write(&nommu_region_sem);
642fb4d1 145 return -ETXTBSY; /* not quite true, but near enough */
81759b5b 146 }
642fb4d1
DH
147 }
148
81759b5b 149 up_write(&nommu_region_sem);
642fb4d1
DH
150 return 0;
151}
152
153/*****************************************************************************/
154/*
155 *
156 */
157static int ramfs_nommu_resize(struct inode *inode, loff_t newsize, loff_t size)
158{
159 int ret;
160
161 /* assume a truncate from zero size is going to be for the purposes of
162 * shared mmap */
163 if (size == 0) {
164 if (unlikely(newsize >> 32))
165 return -EFBIG;
166
167 return ramfs_nommu_expand_for_mapping(inode, newsize);
168 }
169
170 /* check that a decrease in size doesn't cut off any shared mappings */
171 if (newsize < size) {
172 ret = ramfs_nommu_check_mappings(inode, newsize, size);
173 if (ret < 0)
174 return ret;
175 }
176
3f0a6766 177 ret = vmtruncate(inode, newsize);
642fb4d1
DH
178
179 return ret;
180}
181
182/*****************************************************************************/
183/*
184 * handle a change of attributes
185 * - we're specifically interested in a change of size
186 */
187static int ramfs_nommu_setattr(struct dentry *dentry, struct iattr *ia)
188{
189 struct inode *inode = dentry->d_inode;
190 unsigned int old_ia_valid = ia->ia_valid;
191 int ret = 0;
192
85f6038f
BW
193 /* POSIX UID/GID verification for setting inode attributes */
194 ret = inode_change_ok(inode, ia);
195 if (ret)
196 return ret;
197
642fb4d1
DH
198 /* pick out size-changing events */
199 if (ia->ia_valid & ATTR_SIZE) {
200 loff_t size = i_size_read(inode);
201 if (ia->ia_size != size) {
202 ret = ramfs_nommu_resize(inode, ia->ia_size, size);
203 if (ret < 0 || ia->ia_valid == ATTR_SIZE)
204 goto out;
205 } else {
206 /* we skipped the truncate but must still update
207 * timestamps
208 */
209 ia->ia_valid |= ATTR_MTIME|ATTR_CTIME;
210 }
211 }
212
213 ret = inode_setattr(inode, ia);
214 out:
215 ia->ia_valid = old_ia_valid;
216 return ret;
217}
218
219/*****************************************************************************/
220/*
221 * try to determine where a shared mapping can be made
222 * - we require that:
223 * - the pages to be mapped must exist
224 * - the pages be physically contiguous in sequence
225 */
226unsigned long ramfs_nommu_get_unmapped_area(struct file *file,
227 unsigned long addr, unsigned long len,
228 unsigned long pgoff, unsigned long flags)
229{
230 unsigned long maxpages, lpages, nr, loop, ret;
a57c4d65 231 struct inode *inode = file->f_path.dentry->d_inode;
642fb4d1
DH
232 struct page **pages = NULL, **ptr, *page;
233 loff_t isize;
234
235 if (!(flags & MAP_SHARED))
236 return addr;
237
238 /* the mapping mustn't extend beyond the EOF */
239 lpages = (len + PAGE_SIZE - 1) >> PAGE_SHIFT;
240 isize = i_size_read(inode);
241
242 ret = -EINVAL;
243 maxpages = (isize + PAGE_SIZE - 1) >> PAGE_SHIFT;
244 if (pgoff >= maxpages)
245 goto out;
246
247 if (maxpages - pgoff < lpages)
248 goto out;
249
250 /* gang-find the pages */
251 ret = -ENOMEM;
252 pages = kzalloc(lpages * sizeof(struct page *), GFP_KERNEL);
253 if (!pages)
0e8f989a 254 goto out_free;
642fb4d1
DH
255
256 nr = find_get_pages(inode->i_mapping, pgoff, lpages, pages);
257 if (nr != lpages)
0e8f989a 258 goto out_free_pages; /* leave if some pages were missing */
642fb4d1
DH
259
260 /* check the pages for physical adjacency */
261 ptr = pages;
262 page = *ptr++;
263 page++;
264 for (loop = lpages; loop > 1; loop--)
265 if (*ptr++ != page++)
0e8f989a 266 goto out_free_pages;
642fb4d1
DH
267
268 /* okay - all conditions fulfilled */
269 ret = (unsigned long) page_address(pages[0]);
270
0e8f989a
DH
271out_free_pages:
272 ptr = pages;
273 for (loop = nr; loop > 0; loop--)
274 put_page(*ptr++);
275out_free:
276 kfree(pages);
277out:
642fb4d1
DH
278 return ret;
279}
280
281/*****************************************************************************/
282/*
21ff8216 283 * set up a mapping for shared memory segments
642fb4d1
DH
284 */
285int ramfs_nommu_mmap(struct file *file, struct vm_area_struct *vma)
286{
2e92a3ba
DH
287 if (!(vma->vm_flags & VM_SHARED))
288 return -ENOSYS;
289
290 file_accessed(file);
291 vma->vm_ops = &generic_file_vm_ops;
292 return 0;
642fb4d1 293}