]>
Commit | Line | Data |
---|---|---|
b3b94faa DT |
1 | /* |
2 | * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved. | |
3a8a9a10 | 3 | * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved. |
b3b94faa DT |
4 | * |
5 | * This copyrighted material is made available to anyone wishing to use, | |
6 | * modify, copy, or redistribute it subject to the terms and conditions | |
e9fc2aa0 | 7 | * of the GNU General Public License version 2. |
b3b94faa DT |
8 | */ |
9 | ||
10 | #include <linux/sched.h> | |
11 | #include <linux/slab.h> | |
12 | #include <linux/spinlock.h> | |
13 | #include <linux/completion.h> | |
14 | #include <linux/buffer_head.h> | |
15 | #include <linux/posix_acl.h> | |
16 | #include <linux/sort.h> | |
5c676f6d | 17 | #include <linux/gfs2_ondisk.h> |
71b86f56 | 18 | #include <linux/crc32.h> |
7d308590 | 19 | #include <linux/lm_interface.h> |
fcb47e0b | 20 | #include <linux/security.h> |
b3b94faa DT |
21 | |
22 | #include "gfs2.h" | |
5c676f6d | 23 | #include "incore.h" |
b3b94faa DT |
24 | #include "acl.h" |
25 | #include "bmap.h" | |
26 | #include "dir.h" | |
27 | #include "eattr.h" | |
28 | #include "glock.h" | |
29 | #include "glops.h" | |
30 | #include "inode.h" | |
31 | #include "log.h" | |
32 | #include "meta_io.h" | |
33 | #include "ops_address.h" | |
b3b94faa DT |
34 | #include "ops_inode.h" |
35 | #include "quota.h" | |
36 | #include "rgrp.h" | |
37 | #include "trans.h" | |
5c676f6d | 38 | #include "util.h" |
b3b94faa | 39 | |
bb8d8a6f SW |
40 | struct gfs2_inum_range_host { |
41 | u64 ir_start; | |
42 | u64 ir_length; | |
43 | }; | |
44 | ||
feaa7bba SW |
45 | static int iget_test(struct inode *inode, void *opaque) |
46 | { | |
47 | struct gfs2_inode *ip = GFS2_I(inode); | |
dbb7cae2 | 48 | u64 *no_addr = opaque; |
feaa7bba | 49 | |
dbb7cae2 | 50 | if (ip->i_no_addr == *no_addr && |
1be38679 | 51 | inode->i_private != NULL) |
feaa7bba | 52 | return 1; |
b3b94faa | 53 | |
feaa7bba SW |
54 | return 0; |
55 | } | |
56 | ||
57 | static int iget_set(struct inode *inode, void *opaque) | |
b3b94faa | 58 | { |
feaa7bba | 59 | struct gfs2_inode *ip = GFS2_I(inode); |
dbb7cae2 | 60 | u64 *no_addr = opaque; |
b3b94faa | 61 | |
dbb7cae2 SW |
62 | inode->i_ino = (unsigned long)*no_addr; |
63 | ip->i_no_addr = *no_addr; | |
feaa7bba SW |
64 | return 0; |
65 | } | |
b3b94faa | 66 | |
dbb7cae2 | 67 | struct inode *gfs2_ilookup(struct super_block *sb, u64 no_addr) |
feaa7bba | 68 | { |
dbb7cae2 SW |
69 | unsigned long hash = (unsigned long)no_addr; |
70 | return ilookup5(sb, hash, iget_test, &no_addr); | |
feaa7bba | 71 | } |
b3b94faa | 72 | |
dbb7cae2 | 73 | static struct inode *gfs2_iget(struct super_block *sb, u64 no_addr) |
feaa7bba | 74 | { |
dbb7cae2 SW |
75 | unsigned long hash = (unsigned long)no_addr; |
76 | return iget5_locked(sb, hash, iget_test, iget_set, &no_addr); | |
b3b94faa DT |
77 | } |
78 | ||
7a9f53b3 BM |
79 | struct gfs2_skip_data { |
80 | u64 no_addr; | |
81 | int skipped; | |
82 | }; | |
83 | ||
84 | static int iget_skip_test(struct inode *inode, void *opaque) | |
85 | { | |
86 | struct gfs2_inode *ip = GFS2_I(inode); | |
87 | struct gfs2_skip_data *data = opaque; | |
88 | ||
89 | if (ip->i_no_addr == data->no_addr && inode->i_private != NULL){ | |
90 | if (inode->i_state & (I_FREEING|I_CLEAR|I_WILL_FREE)){ | |
91 | data->skipped = 1; | |
92 | return 0; | |
93 | } | |
94 | return 1; | |
95 | } | |
96 | return 0; | |
97 | } | |
98 | ||
99 | static int iget_skip_set(struct inode *inode, void *opaque) | |
100 | { | |
101 | struct gfs2_inode *ip = GFS2_I(inode); | |
102 | struct gfs2_skip_data *data = opaque; | |
103 | ||
104 | if (data->skipped) | |
105 | return 1; | |
106 | inode->i_ino = (unsigned long)(data->no_addr); | |
107 | ip->i_no_addr = data->no_addr; | |
108 | return 0; | |
109 | } | |
110 | ||
111 | static struct inode *gfs2_iget_skip(struct super_block *sb, | |
112 | u64 no_addr) | |
113 | { | |
114 | struct gfs2_skip_data data; | |
115 | unsigned long hash = (unsigned long)no_addr; | |
116 | ||
117 | data.no_addr = no_addr; | |
118 | data.skipped = 0; | |
119 | return iget5_locked(sb, hash, iget_skip_test, iget_skip_set, &data); | |
120 | } | |
121 | ||
35dcc52e WC |
122 | /** |
123 | * GFS2 lookup code fills in vfs inode contents based on info obtained | |
124 | * from directory entry inside gfs2_inode_lookup(). This has caused issues | |
125 | * with NFS code path since its get_dentry routine doesn't have the relevant | |
126 | * directory entry when gfs2_inode_lookup() is invoked. Part of the code | |
127 | * segment inside gfs2_inode_lookup code needs to get moved around. | |
128 | * | |
129 | * Clean up I_LOCK and I_NEW as well. | |
130 | **/ | |
131 | ||
132 | void gfs2_set_iop(struct inode *inode) | |
133 | { | |
134 | umode_t mode = inode->i_mode; | |
135 | ||
136 | if (S_ISREG(mode)) { | |
137 | inode->i_op = &gfs2_file_iops; | |
138 | inode->i_fop = &gfs2_file_fops; | |
35dcc52e WC |
139 | } else if (S_ISDIR(mode)) { |
140 | inode->i_op = &gfs2_dir_iops; | |
141 | inode->i_fop = &gfs2_dir_fops; | |
142 | } else if (S_ISLNK(mode)) { | |
143 | inode->i_op = &gfs2_symlink_iops; | |
144 | } else { | |
145 | inode->i_op = &gfs2_dev_iops; | |
146 | } | |
147 | ||
148 | unlock_new_inode(inode); | |
149 | } | |
150 | ||
b3b94faa | 151 | /** |
feaa7bba SW |
152 | * gfs2_inode_lookup - Lookup an inode |
153 | * @sb: The super block | |
dbb7cae2 | 154 | * @no_addr: The inode number |
feaa7bba | 155 | * @type: The type of the inode |
7a9f53b3 | 156 | * @skip_freeing: set this not return an inode if it is currently being freed. |
b3b94faa | 157 | * |
feaa7bba | 158 | * Returns: A VFS inode, or an error |
b3b94faa DT |
159 | */ |
160 | ||
bb9bcf06 WC |
161 | struct inode *gfs2_inode_lookup(struct super_block *sb, |
162 | unsigned int type, | |
163 | u64 no_addr, | |
7a9f53b3 | 164 | u64 no_formal_ino, int skip_freeing) |
b3b94faa | 165 | { |
7a9f53b3 BM |
166 | struct inode *inode; |
167 | struct gfs2_inode *ip; | |
feaa7bba SW |
168 | struct gfs2_glock *io_gl; |
169 | int error; | |
b3b94faa | 170 | |
7a9f53b3 BM |
171 | if (skip_freeing) |
172 | inode = gfs2_iget_skip(sb, no_addr); | |
173 | else | |
174 | inode = gfs2_iget(sb, no_addr); | |
175 | ip = GFS2_I(inode); | |
176 | ||
26d83ded SW |
177 | if (!inode) |
178 | return ERR_PTR(-ENOBUFS); | |
179 | ||
feaa7bba SW |
180 | if (inode->i_state & I_NEW) { |
181 | struct gfs2_sbd *sdp = GFS2_SB(inode); | |
bba9dfd8 | 182 | inode->i_private = ip; |
bb9bcf06 | 183 | ip->i_no_formal_ino = no_formal_ino; |
b3b94faa | 184 | |
dbb7cae2 | 185 | error = gfs2_glock_get(sdp, no_addr, &gfs2_inode_glops, CREATE, &ip->i_gl); |
feaa7bba SW |
186 | if (unlikely(error)) |
187 | goto fail; | |
188 | ip->i_gl->gl_object = ip; | |
b3b94faa | 189 | |
dbb7cae2 | 190 | error = gfs2_glock_get(sdp, no_addr, &gfs2_iopen_glops, CREATE, &io_gl); |
feaa7bba SW |
191 | if (unlikely(error)) |
192 | goto fail_put; | |
b3b94faa | 193 | |
bfded27b | 194 | set_bit(GIF_INVALID, &ip->i_flags); |
feaa7bba SW |
195 | error = gfs2_glock_nq_init(io_gl, LM_ST_SHARED, GL_EXACT, &ip->i_iopen_gh); |
196 | if (unlikely(error)) | |
197 | goto fail_iopen; | |
d93cfa98 | 198 | ip->i_iopen_gh.gh_gl->gl_object = ip; |
b3b94faa | 199 | |
feaa7bba | 200 | gfs2_glock_put(io_gl); |
c8cdf479 | 201 | |
35dcc52e WC |
202 | if ((type == DT_UNKNOWN) && (no_formal_ino == 0)) |
203 | goto gfs2_nfsbypass; | |
204 | ||
205 | inode->i_mode = DT2IF(type); | |
206 | ||
c8cdf479 SW |
207 | /* |
208 | * We must read the inode in order to work out its type in | |
209 | * this case. Note that this doesn't happen often as we normally | |
210 | * know the type beforehand. This code path only occurs during | |
211 | * unlinked inode recovery (where it is safe to do this glock, | |
212 | * which is not true in the general case). | |
213 | */ | |
c8cdf479 SW |
214 | if (type == DT_UNKNOWN) { |
215 | struct gfs2_holder gh; | |
216 | error = gfs2_glock_nq_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, &gh); | |
217 | if (unlikely(error)) | |
218 | goto fail_glock; | |
219 | /* Inode is now uptodate */ | |
c8cdf479 SW |
220 | gfs2_glock_dq_uninit(&gh); |
221 | } | |
222 | ||
35dcc52e | 223 | gfs2_set_iop(inode); |
feaa7bba | 224 | } |
b3b94faa | 225 | |
35dcc52e | 226 | gfs2_nfsbypass: |
b3b94faa | 227 | return inode; |
c8cdf479 SW |
228 | fail_glock: |
229 | gfs2_glock_dq(&ip->i_iopen_gh); | |
feaa7bba SW |
230 | fail_iopen: |
231 | gfs2_glock_put(io_gl); | |
232 | fail_put: | |
233 | ip->i_gl->gl_object = NULL; | |
234 | gfs2_glock_put(ip->i_gl); | |
235 | fail: | |
236 | iput(inode); | |
237 | return ERR_PTR(error); | |
b3b94faa DT |
238 | } |
239 | ||
af339c02 | 240 | static int gfs2_dinode_in(struct gfs2_inode *ip, const void *buf) |
ea744d01 SW |
241 | { |
242 | struct gfs2_dinode_host *di = &ip->i_di; | |
243 | const struct gfs2_dinode *str = buf; | |
244 | ||
dbb7cae2 | 245 | if (ip->i_no_addr != be64_to_cpu(str->di_num.no_addr)) { |
af339c02 SW |
246 | if (gfs2_consist_inode(ip)) |
247 | gfs2_dinode_print(ip); | |
248 | return -EIO; | |
249 | } | |
dbb7cae2 | 250 | ip->i_no_formal_ino = be64_to_cpu(str->di_num.no_formal_ino); |
b60623c2 | 251 | ip->i_inode.i_mode = be32_to_cpu(str->di_mode); |
e7f14f4d | 252 | ip->i_inode.i_rdev = 0; |
b60623c2 | 253 | switch (ip->i_inode.i_mode & S_IFMT) { |
e7f14f4d SW |
254 | case S_IFBLK: |
255 | case S_IFCHR: | |
256 | ip->i_inode.i_rdev = MKDEV(be32_to_cpu(str->di_major), | |
257 | be32_to_cpu(str->di_minor)); | |
258 | break; | |
259 | }; | |
260 | ||
2933f925 SW |
261 | ip->i_inode.i_uid = be32_to_cpu(str->di_uid); |
262 | ip->i_inode.i_gid = be32_to_cpu(str->di_gid); | |
4f56110a SW |
263 | /* |
264 | * We will need to review setting the nlink count here in the | |
265 | * light of the forthcoming ro bind mount work. This is a reminder | |
266 | * to do that. | |
267 | */ | |
268 | ip->i_inode.i_nlink = be32_to_cpu(str->di_nlink); | |
ea744d01 | 269 | di->di_size = be64_to_cpu(str->di_size); |
9e2dbdac | 270 | i_size_write(&ip->i_inode, di->di_size); |
ea744d01 | 271 | di->di_blocks = be64_to_cpu(str->di_blocks); |
9e2dbdac | 272 | gfs2_set_inode_blocks(&ip->i_inode); |
1a7b1eed | 273 | ip->i_inode.i_atime.tv_sec = be64_to_cpu(str->di_atime); |
4bd91ba1 | 274 | ip->i_inode.i_atime.tv_nsec = be32_to_cpu(str->di_atime_nsec); |
1a7b1eed | 275 | ip->i_inode.i_mtime.tv_sec = be64_to_cpu(str->di_mtime); |
4bd91ba1 | 276 | ip->i_inode.i_mtime.tv_nsec = be32_to_cpu(str->di_mtime_nsec); |
1a7b1eed | 277 | ip->i_inode.i_ctime.tv_sec = be64_to_cpu(str->di_ctime); |
4bd91ba1 | 278 | ip->i_inode.i_ctime.tv_nsec = be32_to_cpu(str->di_ctime_nsec); |
ea744d01 SW |
279 | |
280 | di->di_goal_meta = be64_to_cpu(str->di_goal_meta); | |
281 | di->di_goal_data = be64_to_cpu(str->di_goal_data); | |
282 | di->di_generation = be64_to_cpu(str->di_generation); | |
283 | ||
284 | di->di_flags = be32_to_cpu(str->di_flags); | |
6b124d8d | 285 | gfs2_set_inode_flags(&ip->i_inode); |
ea744d01 SW |
286 | di->di_height = be16_to_cpu(str->di_height); |
287 | ||
288 | di->di_depth = be16_to_cpu(str->di_depth); | |
289 | di->di_entries = be32_to_cpu(str->di_entries); | |
290 | ||
291 | di->di_eattr = be64_to_cpu(str->di_eattr); | |
5561093e SW |
292 | if (S_ISREG(ip->i_inode.i_mode)) |
293 | gfs2_set_aops(&ip->i_inode); | |
294 | ||
af339c02 | 295 | return 0; |
ea744d01 SW |
296 | } |
297 | ||
b3b94faa DT |
298 | /** |
299 | * gfs2_inode_refresh - Refresh the incore copy of the dinode | |
300 | * @ip: The GFS2 inode | |
301 | * | |
302 | * Returns: errno | |
303 | */ | |
304 | ||
305 | int gfs2_inode_refresh(struct gfs2_inode *ip) | |
306 | { | |
307 | struct buffer_head *dibh; | |
308 | int error; | |
309 | ||
310 | error = gfs2_meta_inode_buffer(ip, &dibh); | |
311 | if (error) | |
312 | return error; | |
313 | ||
feaa7bba | 314 | if (gfs2_metatype_check(GFS2_SB(&ip->i_inode), dibh, GFS2_METATYPE_DI)) { |
b3b94faa DT |
315 | brelse(dibh); |
316 | return -EIO; | |
317 | } | |
318 | ||
af339c02 | 319 | error = gfs2_dinode_in(ip, dibh->b_data); |
b3b94faa | 320 | brelse(dibh); |
bfded27b | 321 | clear_bit(GIF_INVALID, &ip->i_flags); |
b3b94faa | 322 | |
af339c02 | 323 | return error; |
b3b94faa DT |
324 | } |
325 | ||
feaa7bba | 326 | int gfs2_dinode_dealloc(struct gfs2_inode *ip) |
b3b94faa | 327 | { |
feaa7bba | 328 | struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode); |
b3b94faa DT |
329 | struct gfs2_alloc *al; |
330 | struct gfs2_rgrpd *rgd; | |
331 | int error; | |
332 | ||
333 | if (ip->i_di.di_blocks != 1) { | |
334 | if (gfs2_consist_inode(ip)) | |
4cc14f0b | 335 | gfs2_dinode_print(ip); |
b3b94faa DT |
336 | return -EIO; |
337 | } | |
338 | ||
339 | al = gfs2_alloc_get(ip); | |
340 | ||
341 | error = gfs2_quota_hold(ip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE); | |
342 | if (error) | |
343 | goto out; | |
344 | ||
345 | error = gfs2_rindex_hold(sdp, &al->al_ri_gh); | |
346 | if (error) | |
347 | goto out_qs; | |
348 | ||
dbb7cae2 | 349 | rgd = gfs2_blk2rgrpd(sdp, ip->i_no_addr); |
b3b94faa DT |
350 | if (!rgd) { |
351 | gfs2_consist_inode(ip); | |
352 | error = -EIO; | |
353 | goto out_rindex_relse; | |
354 | } | |
355 | ||
356 | error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE, 0, | |
357 | &al->al_rgd_gh); | |
358 | if (error) | |
359 | goto out_rindex_relse; | |
360 | ||
420b9e5e | 361 | error = gfs2_trans_begin(sdp, RES_RG_BIT + RES_STATFS + RES_QUOTA, 1); |
b3b94faa DT |
362 | if (error) |
363 | goto out_rg_gunlock; | |
364 | ||
2bcd610d SW |
365 | set_bit(GLF_DIRTY, &ip->i_gl->gl_flags); |
366 | set_bit(GLF_LFLUSH, &ip->i_gl->gl_flags); | |
b3b94faa DT |
367 | |
368 | gfs2_free_di(rgd, ip); | |
369 | ||
b3b94faa DT |
370 | gfs2_trans_end(sdp); |
371 | clear_bit(GLF_STICKY, &ip->i_gl->gl_flags); | |
372 | ||
feaa7bba | 373 | out_rg_gunlock: |
b3b94faa | 374 | gfs2_glock_dq_uninit(&al->al_rgd_gh); |
feaa7bba | 375 | out_rindex_relse: |
b3b94faa | 376 | gfs2_glock_dq_uninit(&al->al_ri_gh); |
feaa7bba | 377 | out_qs: |
b3b94faa | 378 | gfs2_quota_unhold(ip); |
36327521 | 379 | out: |
feaa7bba | 380 | gfs2_alloc_put(ip); |
b3b94faa DT |
381 | return error; |
382 | } | |
383 | ||
b3b94faa | 384 | /** |
87d21e07 | 385 | * gfs2_change_nlink - Change nlink count on inode |
b3b94faa DT |
386 | * @ip: The GFS2 inode |
387 | * @diff: The change in the nlink count required | |
388 | * | |
389 | * Returns: errno | |
390 | */ | |
87d21e07 | 391 | int gfs2_change_nlink(struct gfs2_inode *ip, int diff) |
b3b94faa DT |
392 | { |
393 | struct buffer_head *dibh; | |
cd915493 | 394 | u32 nlink; |
b3b94faa DT |
395 | int error; |
396 | ||
4f56110a SW |
397 | BUG_ON(diff != 1 && diff != -1); |
398 | nlink = ip->i_inode.i_nlink + diff; | |
b3b94faa DT |
399 | |
400 | /* If we are reducing the nlink count, but the new value ends up being | |
401 | bigger than the old one, we must have underflowed. */ | |
4f56110a | 402 | if (diff < 0 && nlink > ip->i_inode.i_nlink) { |
b3b94faa | 403 | if (gfs2_consist_inode(ip)) |
4cc14f0b | 404 | gfs2_dinode_print(ip); |
b3b94faa DT |
405 | return -EIO; |
406 | } | |
407 | ||
408 | error = gfs2_meta_inode_buffer(ip, &dibh); | |
409 | if (error) | |
410 | return error; | |
411 | ||
4f56110a SW |
412 | if (diff > 0) |
413 | inc_nlink(&ip->i_inode); | |
414 | else | |
415 | drop_nlink(&ip->i_inode); | |
416 | ||
4bd91ba1 | 417 | ip->i_inode.i_ctime = CURRENT_TIME; |
b3b94faa | 418 | |
d4e9c4c3 | 419 | gfs2_trans_add_bh(ip->i_gl, dibh, 1); |
539e5d6b | 420 | gfs2_dinode_out(ip, dibh->b_data); |
b3b94faa | 421 | brelse(dibh); |
feaa7bba | 422 | mark_inode_dirty(&ip->i_inode); |
b3b94faa | 423 | |
87d21e07 | 424 | if (ip->i_inode.i_nlink == 0) |
ddee7608 | 425 | gfs2_unlink_di(&ip->i_inode); /* mark inode unlinked */ |
87d21e07 | 426 | |
5509826f WC |
427 | return error; |
428 | } | |
429 | ||
c752666c SW |
430 | struct inode *gfs2_lookup_simple(struct inode *dip, const char *name) |
431 | { | |
432 | struct qstr qstr; | |
6c93fd1e | 433 | struct inode *inode; |
71b86f56 | 434 | gfs2_str2qstr(&qstr, name); |
6c93fd1e RC |
435 | inode = gfs2_lookupi(dip, &qstr, 1, NULL); |
436 | /* gfs2_lookupi has inconsistent callers: vfs | |
437 | * related routines expect NULL for no entry found, | |
438 | * gfs2_lookup_simple callers expect ENOENT | |
439 | * and do not check for NULL. | |
440 | */ | |
441 | if (inode == NULL) | |
442 | return ERR_PTR(-ENOENT); | |
443 | else | |
444 | return inode; | |
c752666c SW |
445 | } |
446 | ||
447 | ||
b3b94faa DT |
448 | /** |
449 | * gfs2_lookupi - Look up a filename in a directory and return its inode | |
450 | * @d_gh: An initialized holder for the directory glock | |
451 | * @name: The name of the inode to look for | |
452 | * @is_root: If 1, ignore the caller's permissions | |
453 | * @i_gh: An uninitialized holder for the new inode glock | |
454 | * | |
d7c103d0 SW |
455 | * This can be called via the VFS filldir function when NFS is doing |
456 | * a readdirplus and the inode which its intending to stat isn't | |
457 | * already in cache. In this case we must not take the directory glock | |
458 | * again, since the readdir call will have already taken that lock. | |
b3b94faa DT |
459 | * |
460 | * Returns: errno | |
461 | */ | |
462 | ||
feaa7bba SW |
463 | struct inode *gfs2_lookupi(struct inode *dir, const struct qstr *name, |
464 | int is_root, struct nameidata *nd) | |
b3b94faa | 465 | { |
c9fd4307 | 466 | struct super_block *sb = dir->i_sb; |
feaa7bba | 467 | struct gfs2_inode *dip = GFS2_I(dir); |
b3b94faa | 468 | struct gfs2_holder d_gh; |
037bcbb7 | 469 | int error = 0; |
c752666c | 470 | struct inode *inode = NULL; |
d7c103d0 | 471 | int unlock = 0; |
b3b94faa DT |
472 | |
473 | if (!name->len || name->len > GFS2_FNAMESIZE) | |
c752666c | 474 | return ERR_PTR(-ENAMETOOLONG); |
b3b94faa | 475 | |
c752666c SW |
476 | if ((name->len == 1 && memcmp(name->name, ".", 1) == 0) || |
477 | (name->len == 2 && memcmp(name->name, "..", 2) == 0 && | |
478 | dir == sb->s_root->d_inode)) { | |
320dd101 SW |
479 | igrab(dir); |
480 | return dir; | |
b3b94faa DT |
481 | } |
482 | ||
d7c103d0 SW |
483 | if (gfs2_glock_is_locked_by_me(dip->i_gl) == 0) { |
484 | error = gfs2_glock_nq_init(dip->i_gl, LM_ST_SHARED, 0, &d_gh); | |
485 | if (error) | |
486 | return ERR_PTR(error); | |
487 | unlock = 1; | |
488 | } | |
b3b94faa DT |
489 | |
490 | if (!is_root) { | |
faf450ef | 491 | error = permission(dir, MAY_EXEC, NULL); |
b3b94faa DT |
492 | if (error) |
493 | goto out; | |
494 | } | |
495 | ||
dbb7cae2 SW |
496 | inode = gfs2_dir_search(dir, name); |
497 | if (IS_ERR(inode)) | |
498 | error = PTR_ERR(inode); | |
7359a19c | 499 | out: |
d7c103d0 SW |
500 | if (unlock) |
501 | gfs2_glock_dq_uninit(&d_gh); | |
c752666c SW |
502 | if (error == -ENOENT) |
503 | return NULL; | |
d7c103d0 | 504 | return inode ? inode : ERR_PTR(error); |
b3b94faa DT |
505 | } |
506 | ||
bb8d8a6f SW |
507 | static void gfs2_inum_range_in(struct gfs2_inum_range_host *ir, const void *buf) |
508 | { | |
509 | const struct gfs2_inum_range *str = buf; | |
510 | ||
511 | ir->ir_start = be64_to_cpu(str->ir_start); | |
512 | ir->ir_length = be64_to_cpu(str->ir_length); | |
513 | } | |
514 | ||
515 | static void gfs2_inum_range_out(const struct gfs2_inum_range_host *ir, void *buf) | |
516 | { | |
517 | struct gfs2_inum_range *str = buf; | |
518 | ||
519 | str->ir_start = cpu_to_be64(ir->ir_start); | |
520 | str->ir_length = cpu_to_be64(ir->ir_length); | |
521 | } | |
522 | ||
cd915493 | 523 | static int pick_formal_ino_1(struct gfs2_sbd *sdp, u64 *formal_ino) |
b3b94faa | 524 | { |
feaa7bba | 525 | struct gfs2_inode *ip = GFS2_I(sdp->sd_ir_inode); |
b3b94faa | 526 | struct buffer_head *bh; |
e6972647 | 527 | struct gfs2_inum_range_host ir; |
b3b94faa DT |
528 | int error; |
529 | ||
530 | error = gfs2_trans_begin(sdp, RES_DINODE, 0); | |
531 | if (error) | |
532 | return error; | |
f55ab26a | 533 | mutex_lock(&sdp->sd_inum_mutex); |
b3b94faa DT |
534 | |
535 | error = gfs2_meta_inode_buffer(ip, &bh); | |
536 | if (error) { | |
f55ab26a | 537 | mutex_unlock(&sdp->sd_inum_mutex); |
b3b94faa DT |
538 | gfs2_trans_end(sdp); |
539 | return error; | |
540 | } | |
541 | ||
542 | gfs2_inum_range_in(&ir, bh->b_data + sizeof(struct gfs2_dinode)); | |
543 | ||
544 | if (ir.ir_length) { | |
545 | *formal_ino = ir.ir_start++; | |
546 | ir.ir_length--; | |
d4e9c4c3 | 547 | gfs2_trans_add_bh(ip->i_gl, bh, 1); |
b3b94faa DT |
548 | gfs2_inum_range_out(&ir, |
549 | bh->b_data + sizeof(struct gfs2_dinode)); | |
550 | brelse(bh); | |
f55ab26a | 551 | mutex_unlock(&sdp->sd_inum_mutex); |
b3b94faa DT |
552 | gfs2_trans_end(sdp); |
553 | return 0; | |
554 | } | |
555 | ||
556 | brelse(bh); | |
557 | ||
f55ab26a | 558 | mutex_unlock(&sdp->sd_inum_mutex); |
b3b94faa DT |
559 | gfs2_trans_end(sdp); |
560 | ||
561 | return 1; | |
562 | } | |
563 | ||
cd915493 | 564 | static int pick_formal_ino_2(struct gfs2_sbd *sdp, u64 *formal_ino) |
b3b94faa | 565 | { |
feaa7bba SW |
566 | struct gfs2_inode *ip = GFS2_I(sdp->sd_ir_inode); |
567 | struct gfs2_inode *m_ip = GFS2_I(sdp->sd_inum_inode); | |
b3b94faa DT |
568 | struct gfs2_holder gh; |
569 | struct buffer_head *bh; | |
e6972647 | 570 | struct gfs2_inum_range_host ir; |
b3b94faa DT |
571 | int error; |
572 | ||
573 | error = gfs2_glock_nq_init(m_ip->i_gl, LM_ST_EXCLUSIVE, 0, &gh); | |
574 | if (error) | |
575 | return error; | |
576 | ||
577 | error = gfs2_trans_begin(sdp, 2 * RES_DINODE, 0); | |
578 | if (error) | |
579 | goto out; | |
f55ab26a | 580 | mutex_lock(&sdp->sd_inum_mutex); |
b3b94faa DT |
581 | |
582 | error = gfs2_meta_inode_buffer(ip, &bh); | |
583 | if (error) | |
584 | goto out_end_trans; | |
907b9bce | 585 | |
b3b94faa DT |
586 | gfs2_inum_range_in(&ir, bh->b_data + sizeof(struct gfs2_dinode)); |
587 | ||
588 | if (!ir.ir_length) { | |
589 | struct buffer_head *m_bh; | |
cd915493 | 590 | u64 x, y; |
b44b84d7 | 591 | __be64 z; |
b3b94faa DT |
592 | |
593 | error = gfs2_meta_inode_buffer(m_ip, &m_bh); | |
594 | if (error) | |
595 | goto out_brelse; | |
596 | ||
b44b84d7 AV |
597 | z = *(__be64 *)(m_bh->b_data + sizeof(struct gfs2_dinode)); |
598 | x = y = be64_to_cpu(z); | |
b3b94faa DT |
599 | ir.ir_start = x; |
600 | ir.ir_length = GFS2_INUM_QUANTUM; | |
601 | x += GFS2_INUM_QUANTUM; | |
602 | if (x < y) | |
603 | gfs2_consist_inode(m_ip); | |
b44b84d7 | 604 | z = cpu_to_be64(x); |
d4e9c4c3 | 605 | gfs2_trans_add_bh(m_ip->i_gl, m_bh, 1); |
b44b84d7 | 606 | *(__be64 *)(m_bh->b_data + sizeof(struct gfs2_dinode)) = z; |
b3b94faa DT |
607 | |
608 | brelse(m_bh); | |
609 | } | |
610 | ||
611 | *formal_ino = ir.ir_start++; | |
612 | ir.ir_length--; | |
613 | ||
d4e9c4c3 | 614 | gfs2_trans_add_bh(ip->i_gl, bh, 1); |
b3b94faa DT |
615 | gfs2_inum_range_out(&ir, bh->b_data + sizeof(struct gfs2_dinode)); |
616 | ||
420b9e5e | 617 | out_brelse: |
b3b94faa | 618 | brelse(bh); |
420b9e5e | 619 | out_end_trans: |
f55ab26a | 620 | mutex_unlock(&sdp->sd_inum_mutex); |
b3b94faa | 621 | gfs2_trans_end(sdp); |
420b9e5e | 622 | out: |
b3b94faa | 623 | gfs2_glock_dq_uninit(&gh); |
b3b94faa DT |
624 | return error; |
625 | } | |
626 | ||
cd915493 | 627 | static int pick_formal_ino(struct gfs2_sbd *sdp, u64 *inum) |
b3b94faa DT |
628 | { |
629 | int error; | |
630 | ||
631 | error = pick_formal_ino_1(sdp, inum); | |
632 | if (error <= 0) | |
633 | return error; | |
634 | ||
635 | error = pick_formal_ino_2(sdp, inum); | |
636 | ||
637 | return error; | |
638 | } | |
639 | ||
640 | /** | |
641 | * create_ok - OK to create a new on-disk inode here? | |
642 | * @dip: Directory in which dinode is to be created | |
643 | * @name: Name of new dinode | |
644 | * @mode: | |
645 | * | |
646 | * Returns: errno | |
647 | */ | |
648 | ||
feaa7bba | 649 | static int create_ok(struct gfs2_inode *dip, const struct qstr *name, |
b3b94faa DT |
650 | unsigned int mode) |
651 | { | |
652 | int error; | |
653 | ||
faf450ef | 654 | error = permission(&dip->i_inode, MAY_WRITE | MAY_EXEC, NULL); |
b3b94faa DT |
655 | if (error) |
656 | return error; | |
657 | ||
658 | /* Don't create entries in an unlinked directory */ | |
4f56110a | 659 | if (!dip->i_inode.i_nlink) |
b3b94faa DT |
660 | return -EPERM; |
661 | ||
dbb7cae2 | 662 | error = gfs2_dir_check(&dip->i_inode, name, NULL); |
b3b94faa DT |
663 | switch (error) { |
664 | case -ENOENT: | |
665 | error = 0; | |
666 | break; | |
667 | case 0: | |
668 | return -EEXIST; | |
669 | default: | |
670 | return error; | |
671 | } | |
672 | ||
cd915493 | 673 | if (dip->i_di.di_entries == (u32)-1) |
b3b94faa | 674 | return -EFBIG; |
4f56110a | 675 | if (S_ISDIR(mode) && dip->i_inode.i_nlink == (u32)-1) |
b3b94faa DT |
676 | return -EMLINK; |
677 | ||
678 | return 0; | |
679 | } | |
680 | ||
681 | static void munge_mode_uid_gid(struct gfs2_inode *dip, unsigned int *mode, | |
682 | unsigned int *uid, unsigned int *gid) | |
683 | { | |
feaa7bba | 684 | if (GFS2_SB(&dip->i_inode)->sd_args.ar_suiddir && |
2933f925 | 685 | (dip->i_inode.i_mode & S_ISUID) && dip->i_inode.i_uid) { |
b3b94faa DT |
686 | if (S_ISDIR(*mode)) |
687 | *mode |= S_ISUID; | |
2933f925 | 688 | else if (dip->i_inode.i_uid != current->fsuid) |
b3b94faa | 689 | *mode &= ~07111; |
2933f925 | 690 | *uid = dip->i_inode.i_uid; |
b3b94faa DT |
691 | } else |
692 | *uid = current->fsuid; | |
693 | ||
b60623c2 | 694 | if (dip->i_inode.i_mode & S_ISGID) { |
b3b94faa DT |
695 | if (S_ISDIR(*mode)) |
696 | *mode |= S_ISGID; | |
2933f925 | 697 | *gid = dip->i_inode.i_gid; |
b3b94faa DT |
698 | } else |
699 | *gid = current->fsgid; | |
700 | } | |
701 | ||
dbb7cae2 | 702 | static int alloc_dinode(struct gfs2_inode *dip, u64 *no_addr, u64 *generation) |
b3b94faa | 703 | { |
feaa7bba | 704 | struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode); |
b3b94faa DT |
705 | int error; |
706 | ||
707 | gfs2_alloc_get(dip); | |
708 | ||
709 | dip->i_alloc.al_requested = RES_DINODE; | |
710 | error = gfs2_inplace_reserve(dip); | |
711 | if (error) | |
712 | goto out; | |
713 | ||
feaa7bba | 714 | error = gfs2_trans_begin(sdp, RES_RG_BIT + RES_STATFS, 0); |
b3b94faa DT |
715 | if (error) |
716 | goto out_ipreserv; | |
717 | ||
dbb7cae2 | 718 | *no_addr = gfs2_alloc_di(dip, generation); |
b3b94faa DT |
719 | |
720 | gfs2_trans_end(sdp); | |
721 | ||
4340fe62 | 722 | out_ipreserv: |
b3b94faa | 723 | gfs2_inplace_release(dip); |
4340fe62 | 724 | out: |
b3b94faa | 725 | gfs2_alloc_put(dip); |
b3b94faa DT |
726 | return error; |
727 | } | |
728 | ||
729 | /** | |
730 | * init_dinode - Fill in a new dinode structure | |
731 | * @dip: the directory this inode is being created in | |
732 | * @gl: The glock covering the new inode | |
733 | * @inum: the inode number | |
734 | * @mode: the file permissions | |
735 | * @uid: | |
736 | * @gid: | |
737 | * | |
738 | */ | |
739 | ||
740 | static void init_dinode(struct gfs2_inode *dip, struct gfs2_glock *gl, | |
629a21e7 | 741 | const struct gfs2_inum_host *inum, unsigned int mode, |
4340fe62 | 742 | unsigned int uid, unsigned int gid, |
e9bd2b3b | 743 | const u64 *generation, dev_t dev, struct buffer_head **bhp) |
b3b94faa | 744 | { |
feaa7bba | 745 | struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode); |
b96ca4fa | 746 | struct gfs2_dinode *di; |
b3b94faa | 747 | struct buffer_head *dibh; |
4bd91ba1 | 748 | struct timespec tv = CURRENT_TIME; |
b3b94faa DT |
749 | |
750 | dibh = gfs2_meta_new(gl, inum->no_addr); | |
d4e9c4c3 | 751 | gfs2_trans_add_bh(gl, dibh, 1); |
b3b94faa DT |
752 | gfs2_metatype_set(dibh, GFS2_METATYPE_DI, GFS2_FORMAT_DI); |
753 | gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode)); | |
b96ca4fa SW |
754 | di = (struct gfs2_dinode *)dibh->b_data; |
755 | ||
2442a098 SW |
756 | di->di_num.no_formal_ino = cpu_to_be64(inum->no_formal_ino); |
757 | di->di_num.no_addr = cpu_to_be64(inum->no_addr); | |
b96ca4fa SW |
758 | di->di_mode = cpu_to_be32(mode); |
759 | di->di_uid = cpu_to_be32(uid); | |
760 | di->di_gid = cpu_to_be32(gid); | |
294caaa3 SW |
761 | di->di_nlink = 0; |
762 | di->di_size = 0; | |
b96ca4fa | 763 | di->di_blocks = cpu_to_be64(1); |
4bd91ba1 | 764 | di->di_atime = di->di_mtime = di->di_ctime = cpu_to_be64(tv.tv_sec); |
e7f14f4d SW |
765 | di->di_major = cpu_to_be32(MAJOR(dev)); |
766 | di->di_minor = cpu_to_be32(MINOR(dev)); | |
b96ca4fa | 767 | di->di_goal_meta = di->di_goal_data = cpu_to_be64(inum->no_addr); |
4340fe62 | 768 | di->di_generation = cpu_to_be64(*generation); |
294caaa3 | 769 | di->di_flags = 0; |
b3b94faa DT |
770 | |
771 | if (S_ISREG(mode)) { | |
772 | if ((dip->i_di.di_flags & GFS2_DIF_INHERIT_JDATA) || | |
773 | gfs2_tune_get(sdp, gt_new_files_jdata)) | |
b96ca4fa | 774 | di->di_flags |= cpu_to_be32(GFS2_DIF_JDATA); |
b3b94faa DT |
775 | if ((dip->i_di.di_flags & GFS2_DIF_INHERIT_DIRECTIO) || |
776 | gfs2_tune_get(sdp, gt_new_files_directio)) | |
b96ca4fa | 777 | di->di_flags |= cpu_to_be32(GFS2_DIF_DIRECTIO); |
b3b94faa | 778 | } else if (S_ISDIR(mode)) { |
568f4c96 SW |
779 | di->di_flags |= cpu_to_be32(dip->i_di.di_flags & |
780 | GFS2_DIF_INHERIT_DIRECTIO); | |
781 | di->di_flags |= cpu_to_be32(dip->i_di.di_flags & | |
782 | GFS2_DIF_INHERIT_JDATA); | |
b3b94faa DT |
783 | } |
784 | ||
b96ca4fa | 785 | di->__pad1 = 0; |
a9583c79 | 786 | di->di_payload_format = cpu_to_be32(S_ISDIR(mode) ? GFS2_FORMAT_DE : 0); |
294caaa3 | 787 | di->di_height = 0; |
b96ca4fa SW |
788 | di->__pad2 = 0; |
789 | di->__pad3 = 0; | |
294caaa3 SW |
790 | di->di_depth = 0; |
791 | di->di_entries = 0; | |
b96ca4fa | 792 | memset(&di->__pad4, 0, sizeof(di->__pad4)); |
294caaa3 | 793 | di->di_eattr = 0; |
4bd91ba1 SW |
794 | di->di_atime_nsec = cpu_to_be32(tv.tv_nsec); |
795 | di->di_mtime_nsec = cpu_to_be32(tv.tv_nsec); | |
796 | di->di_ctime_nsec = cpu_to_be32(tv.tv_nsec); | |
b96ca4fa | 797 | memset(&di->di_reserved, 0, sizeof(di->di_reserved)); |
e9bd2b3b WC |
798 | |
799 | set_buffer_uptodate(dibh); | |
b96ca4fa | 800 | |
e9bd2b3b | 801 | *bhp = dibh; |
b3b94faa DT |
802 | } |
803 | ||
804 | static int make_dinode(struct gfs2_inode *dip, struct gfs2_glock *gl, | |
629a21e7 | 805 | unsigned int mode, const struct gfs2_inum_host *inum, |
e9bd2b3b | 806 | const u64 *generation, dev_t dev, struct buffer_head **bhp) |
b3b94faa | 807 | { |
feaa7bba | 808 | struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode); |
b3b94faa DT |
809 | unsigned int uid, gid; |
810 | int error; | |
811 | ||
812 | munge_mode_uid_gid(dip, &mode, &uid, &gid); | |
b3b94faa DT |
813 | gfs2_alloc_get(dip); |
814 | ||
815 | error = gfs2_quota_lock(dip, uid, gid); | |
816 | if (error) | |
817 | goto out; | |
818 | ||
819 | error = gfs2_quota_check(dip, uid, gid); | |
820 | if (error) | |
821 | goto out_quota; | |
822 | ||
feaa7bba | 823 | error = gfs2_trans_begin(sdp, RES_DINODE + RES_QUOTA, 0); |
b3b94faa DT |
824 | if (error) |
825 | goto out_quota; | |
826 | ||
e9bd2b3b | 827 | init_dinode(dip, gl, inum, mode, uid, gid, generation, dev, bhp); |
b3b94faa | 828 | gfs2_quota_change(dip, +1, uid, gid); |
b3b94faa DT |
829 | gfs2_trans_end(sdp); |
830 | ||
feaa7bba | 831 | out_quota: |
b3b94faa | 832 | gfs2_quota_unlock(dip); |
feaa7bba | 833 | out: |
b3b94faa | 834 | gfs2_alloc_put(dip); |
b3b94faa DT |
835 | return error; |
836 | } | |
837 | ||
feaa7bba SW |
838 | static int link_dinode(struct gfs2_inode *dip, const struct qstr *name, |
839 | struct gfs2_inode *ip) | |
b3b94faa | 840 | { |
feaa7bba | 841 | struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode); |
b3b94faa DT |
842 | struct gfs2_alloc *al; |
843 | int alloc_required; | |
844 | struct buffer_head *dibh; | |
845 | int error; | |
846 | ||
847 | al = gfs2_alloc_get(dip); | |
848 | ||
849 | error = gfs2_quota_lock(dip, NO_QUOTA_CHANGE, NO_QUOTA_CHANGE); | |
850 | if (error) | |
851 | goto fail; | |
852 | ||
feaa7bba | 853 | error = alloc_required = gfs2_diradd_alloc_required(&dip->i_inode, name); |
c752666c SW |
854 | if (alloc_required < 0) |
855 | goto fail; | |
b3b94faa | 856 | if (alloc_required) { |
2933f925 | 857 | error = gfs2_quota_check(dip, dip->i_inode.i_uid, dip->i_inode.i_gid); |
b3b94faa DT |
858 | if (error) |
859 | goto fail_quota_locks; | |
860 | ||
861 | al->al_requested = sdp->sd_max_dirres; | |
862 | ||
863 | error = gfs2_inplace_reserve(dip); | |
864 | if (error) | |
865 | goto fail_quota_locks; | |
866 | ||
320dd101 | 867 | error = gfs2_trans_begin(sdp, sdp->sd_max_dirres + |
bb8d8a6f | 868 | al->al_rgd->rd_length + |
907b9bce | 869 | 2 * RES_DINODE + |
b3b94faa DT |
870 | RES_STATFS + RES_QUOTA, 0); |
871 | if (error) | |
872 | goto fail_ipreserv; | |
873 | } else { | |
feaa7bba | 874 | error = gfs2_trans_begin(sdp, RES_LEAF + 2 * RES_DINODE, 0); |
b3b94faa DT |
875 | if (error) |
876 | goto fail_quota_locks; | |
877 | } | |
878 | ||
dbb7cae2 | 879 | error = gfs2_dir_add(&dip->i_inode, name, ip, IF2DT(ip->i_inode.i_mode)); |
b3b94faa DT |
880 | if (error) |
881 | goto fail_end_trans; | |
882 | ||
883 | error = gfs2_meta_inode_buffer(ip, &dibh); | |
884 | if (error) | |
885 | goto fail_end_trans; | |
4f56110a | 886 | ip->i_inode.i_nlink = 1; |
d4e9c4c3 | 887 | gfs2_trans_add_bh(ip->i_gl, dibh, 1); |
539e5d6b | 888 | gfs2_dinode_out(ip, dibh->b_data); |
b3b94faa | 889 | brelse(dibh); |
b3b94faa DT |
890 | return 0; |
891 | ||
320dd101 | 892 | fail_end_trans: |
b3b94faa DT |
893 | gfs2_trans_end(sdp); |
894 | ||
320dd101 | 895 | fail_ipreserv: |
b3b94faa DT |
896 | if (dip->i_alloc.al_rgd) |
897 | gfs2_inplace_release(dip); | |
898 | ||
320dd101 | 899 | fail_quota_locks: |
b3b94faa DT |
900 | gfs2_quota_unlock(dip); |
901 | ||
320dd101 | 902 | fail: |
b3b94faa | 903 | gfs2_alloc_put(dip); |
b3b94faa DT |
904 | return error; |
905 | } | |
906 | ||
fcb47e0b RH |
907 | static int gfs2_security_init(struct gfs2_inode *dip, struct gfs2_inode *ip) |
908 | { | |
909 | int err; | |
910 | size_t len; | |
911 | void *value; | |
912 | char *name; | |
913 | struct gfs2_ea_request er; | |
914 | ||
915 | err = security_inode_init_security(&ip->i_inode, &dip->i_inode, | |
916 | &name, &value, &len); | |
917 | ||
918 | if (err) { | |
919 | if (err == -EOPNOTSUPP) | |
920 | return 0; | |
921 | return err; | |
922 | } | |
923 | ||
924 | memset(&er, 0, sizeof(struct gfs2_ea_request)); | |
925 | ||
926 | er.er_type = GFS2_EATYPE_SECURITY; | |
927 | er.er_name = name; | |
928 | er.er_data = value; | |
929 | er.er_name_len = strlen(name); | |
930 | er.er_data_len = len; | |
931 | ||
932 | err = gfs2_ea_set_i(ip, &er); | |
933 | ||
934 | kfree(value); | |
935 | kfree(name); | |
936 | ||
937 | return err; | |
938 | } | |
939 | ||
b3b94faa DT |
940 | /** |
941 | * gfs2_createi - Create a new inode | |
942 | * @ghs: An array of two holders | |
943 | * @name: The name of the new file | |
944 | * @mode: the permissions on the new inode | |
945 | * | |
946 | * @ghs[0] is an initialized holder for the directory | |
947 | * @ghs[1] is the holder for the inode lock | |
948 | * | |
7359a19c | 949 | * If the return value is not NULL, the glocks on both the directory and the new |
b3b94faa DT |
950 | * file are held. A transaction has been started and an inplace reservation |
951 | * is held, as well. | |
952 | * | |
7359a19c | 953 | * Returns: An inode |
b3b94faa DT |
954 | */ |
955 | ||
feaa7bba | 956 | struct inode *gfs2_createi(struct gfs2_holder *ghs, const struct qstr *name, |
e7f14f4d | 957 | unsigned int mode, dev_t dev) |
b3b94faa | 958 | { |
e1cc8603 | 959 | struct inode *inode = NULL; |
5c676f6d | 960 | struct gfs2_inode *dip = ghs->gh_gl->gl_object; |
feaa7bba SW |
961 | struct inode *dir = &dip->i_inode; |
962 | struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode); | |
dbb7cae2 | 963 | struct gfs2_inum_host inum = { .no_addr = 0, .no_formal_ino = 0 }; |
b3b94faa | 964 | int error; |
4340fe62 | 965 | u64 generation; |
f91a0d3e | 966 | struct buffer_head *bh = NULL; |
b3b94faa DT |
967 | |
968 | if (!name->len || name->len > GFS2_FNAMESIZE) | |
7359a19c | 969 | return ERR_PTR(-ENAMETOOLONG); |
b3b94faa | 970 | |
b3b94faa DT |
971 | gfs2_holder_reinit(LM_ST_EXCLUSIVE, 0, ghs); |
972 | error = gfs2_glock_nq(ghs); | |
973 | if (error) | |
974 | goto fail; | |
975 | ||
976 | error = create_ok(dip, name, mode); | |
977 | if (error) | |
978 | goto fail_gunlock; | |
979 | ||
feaa7bba | 980 | error = pick_formal_ino(sdp, &inum.no_formal_ino); |
b3b94faa DT |
981 | if (error) |
982 | goto fail_gunlock; | |
983 | ||
dbb7cae2 | 984 | error = alloc_dinode(dip, &inum.no_addr, &generation); |
b3b94faa DT |
985 | if (error) |
986 | goto fail_gunlock; | |
987 | ||
28626e20 SW |
988 | error = gfs2_glock_nq_num(sdp, inum.no_addr, &gfs2_inode_glops, |
989 | LM_ST_EXCLUSIVE, GL_SKIP, ghs + 1); | |
990 | if (error) | |
991 | goto fail_gunlock; | |
b3b94faa | 992 | |
e9bd2b3b | 993 | error = make_dinode(dip, ghs[1].gh_gl, mode, &inum, &generation, dev, &bh); |
b3b94faa DT |
994 | if (error) |
995 | goto fail_gunlock2; | |
996 | ||
bb9bcf06 WC |
997 | inode = gfs2_inode_lookup(dir->i_sb, IF2DT(mode), |
998 | inum.no_addr, | |
7a9f53b3 | 999 | inum.no_formal_ino, 0); |
feaa7bba | 1000 | if (IS_ERR(inode)) |
b3b94faa DT |
1001 | goto fail_gunlock2; |
1002 | ||
feaa7bba | 1003 | error = gfs2_inode_refresh(GFS2_I(inode)); |
b3b94faa | 1004 | if (error) |
e1cc8603 | 1005 | goto fail_gunlock2; |
b3b94faa | 1006 | |
feaa7bba | 1007 | error = gfs2_acl_create(dip, GFS2_I(inode)); |
b3b94faa | 1008 | if (error) |
e1cc8603 | 1009 | goto fail_gunlock2; |
b3b94faa | 1010 | |
fcb47e0b RH |
1011 | error = gfs2_security_init(dip, GFS2_I(inode)); |
1012 | if (error) | |
e1cc8603 | 1013 | goto fail_gunlock2; |
fcb47e0b | 1014 | |
feaa7bba | 1015 | error = link_dinode(dip, name, GFS2_I(inode)); |
b3b94faa | 1016 | if (error) |
e1cc8603 | 1017 | goto fail_gunlock2; |
b3b94faa | 1018 | |
f91a0d3e SW |
1019 | if (bh) |
1020 | brelse(bh); | |
7359a19c SW |
1021 | if (!inode) |
1022 | return ERR_PTR(-ENOMEM); | |
1023 | return inode; | |
b3b94faa | 1024 | |
320dd101 | 1025 | fail_gunlock2: |
b3b94faa | 1026 | gfs2_glock_dq_uninit(ghs + 1); |
e1cc8603 SW |
1027 | if (inode) |
1028 | iput(inode); | |
320dd101 | 1029 | fail_gunlock: |
b3b94faa | 1030 | gfs2_glock_dq(ghs); |
320dd101 | 1031 | fail: |
f91a0d3e SW |
1032 | if (bh) |
1033 | brelse(bh); | |
7359a19c | 1034 | return ERR_PTR(error); |
b3b94faa DT |
1035 | } |
1036 | ||
b3b94faa DT |
1037 | /** |
1038 | * gfs2_rmdiri - Remove a directory | |
1039 | * @dip: The parent directory of the directory to be removed | |
1040 | * @name: The name of the directory to be removed | |
1041 | * @ip: The GFS2 inode of the directory to be removed | |
1042 | * | |
1043 | * Assumes Glocks on dip and ip are held | |
1044 | * | |
1045 | * Returns: errno | |
1046 | */ | |
1047 | ||
feaa7bba SW |
1048 | int gfs2_rmdiri(struct gfs2_inode *dip, const struct qstr *name, |
1049 | struct gfs2_inode *ip) | |
b3b94faa | 1050 | { |
b3b94faa DT |
1051 | struct qstr dotname; |
1052 | int error; | |
1053 | ||
1054 | if (ip->i_di.di_entries != 2) { | |
1055 | if (gfs2_consist_inode(ip)) | |
4cc14f0b | 1056 | gfs2_dinode_print(ip); |
b3b94faa DT |
1057 | return -EIO; |
1058 | } | |
1059 | ||
1060 | error = gfs2_dir_del(dip, name); | |
1061 | if (error) | |
1062 | return error; | |
1063 | ||
1064 | error = gfs2_change_nlink(dip, -1); | |
1065 | if (error) | |
1066 | return error; | |
1067 | ||
71b86f56 | 1068 | gfs2_str2qstr(&dotname, "."); |
b3b94faa DT |
1069 | error = gfs2_dir_del(ip, &dotname); |
1070 | if (error) | |
1071 | return error; | |
1072 | ||
feaa7bba | 1073 | gfs2_str2qstr(&dotname, ".."); |
b3b94faa DT |
1074 | error = gfs2_dir_del(ip, &dotname); |
1075 | if (error) | |
1076 | return error; | |
1077 | ||
4f56110a SW |
1078 | /* It looks odd, but it really should be done twice */ |
1079 | error = gfs2_change_nlink(ip, -1); | |
1080 | if (error) | |
1081 | return error; | |
1082 | ||
1083 | error = gfs2_change_nlink(ip, -1); | |
b3b94faa DT |
1084 | if (error) |
1085 | return error; | |
1086 | ||
b3b94faa DT |
1087 | return error; |
1088 | } | |
1089 | ||
1090 | /* | |
1091 | * gfs2_unlink_ok - check to see that a inode is still in a directory | |
1092 | * @dip: the directory | |
1093 | * @name: the name of the file | |
1094 | * @ip: the inode | |
1095 | * | |
1096 | * Assumes that the lock on (at least) @dip is held. | |
1097 | * | |
1098 | * Returns: 0 if the parent/child relationship is correct, errno if it isn't | |
1099 | */ | |
1100 | ||
feaa7bba | 1101 | int gfs2_unlink_ok(struct gfs2_inode *dip, const struct qstr *name, |
dbb7cae2 | 1102 | const struct gfs2_inode *ip) |
b3b94faa | 1103 | { |
b3b94faa DT |
1104 | int error; |
1105 | ||
feaa7bba | 1106 | if (IS_IMMUTABLE(&ip->i_inode) || IS_APPEND(&ip->i_inode)) |
b3b94faa DT |
1107 | return -EPERM; |
1108 | ||
b60623c2 | 1109 | if ((dip->i_inode.i_mode & S_ISVTX) && |
2933f925 SW |
1110 | dip->i_inode.i_uid != current->fsuid && |
1111 | ip->i_inode.i_uid != current->fsuid && !capable(CAP_FOWNER)) | |
b3b94faa DT |
1112 | return -EPERM; |
1113 | ||
feaa7bba | 1114 | if (IS_APPEND(&dip->i_inode)) |
b3b94faa DT |
1115 | return -EPERM; |
1116 | ||
faf450ef | 1117 | error = permission(&dip->i_inode, MAY_WRITE | MAY_EXEC, NULL); |
b3b94faa DT |
1118 | if (error) |
1119 | return error; | |
1120 | ||
dbb7cae2 | 1121 | error = gfs2_dir_check(&dip->i_inode, name, ip); |
b3b94faa DT |
1122 | if (error) |
1123 | return error; | |
1124 | ||
b3b94faa DT |
1125 | return 0; |
1126 | } | |
1127 | ||
1128 | /* | |
1129 | * gfs2_ok_to_move - check if it's ok to move a directory to another directory | |
1130 | * @this: move this | |
1131 | * @to: to here | |
1132 | * | |
1133 | * Follow @to back to the root and make sure we don't encounter @this | |
1134 | * Assumes we already hold the rename lock. | |
1135 | * | |
1136 | * Returns: errno | |
1137 | */ | |
1138 | ||
1139 | int gfs2_ok_to_move(struct gfs2_inode *this, struct gfs2_inode *to) | |
1140 | { | |
feaa7bba | 1141 | struct inode *dir = &to->i_inode; |
c9fd4307 | 1142 | struct super_block *sb = dir->i_sb; |
7359a19c | 1143 | struct inode *tmp; |
b3b94faa DT |
1144 | struct qstr dotdot; |
1145 | int error = 0; | |
1146 | ||
71b86f56 | 1147 | gfs2_str2qstr(&dotdot, ".."); |
b3b94faa | 1148 | |
7359a19c | 1149 | igrab(dir); |
b3b94faa DT |
1150 | |
1151 | for (;;) { | |
feaa7bba | 1152 | if (dir == &this->i_inode) { |
b3b94faa DT |
1153 | error = -EINVAL; |
1154 | break; | |
1155 | } | |
c9fd4307 | 1156 | if (dir == sb->s_root->d_inode) { |
b3b94faa DT |
1157 | error = 0; |
1158 | break; | |
1159 | } | |
1160 | ||
c752666c SW |
1161 | tmp = gfs2_lookupi(dir, &dotdot, 1, NULL); |
1162 | if (IS_ERR(tmp)) { | |
1163 | error = PTR_ERR(tmp); | |
b3b94faa | 1164 | break; |
c752666c | 1165 | } |
b3b94faa | 1166 | |
7359a19c SW |
1167 | iput(dir); |
1168 | dir = tmp; | |
b3b94faa DT |
1169 | } |
1170 | ||
7359a19c | 1171 | iput(dir); |
b3b94faa DT |
1172 | |
1173 | return error; | |
1174 | } | |
1175 | ||
1176 | /** | |
1177 | * gfs2_readlinki - return the contents of a symlink | |
1178 | * @ip: the symlink's inode | |
1179 | * @buf: a pointer to the buffer to be filled | |
1180 | * @len: a pointer to the length of @buf | |
1181 | * | |
1182 | * If @buf is too small, a piece of memory is kmalloc()ed and needs | |
1183 | * to be freed by the caller. | |
1184 | * | |
1185 | * Returns: errno | |
1186 | */ | |
1187 | ||
1188 | int gfs2_readlinki(struct gfs2_inode *ip, char **buf, unsigned int *len) | |
1189 | { | |
1190 | struct gfs2_holder i_gh; | |
1191 | struct buffer_head *dibh; | |
1192 | unsigned int x; | |
1193 | int error; | |
1194 | ||
1195 | gfs2_holder_init(ip->i_gl, LM_ST_SHARED, GL_ATIME, &i_gh); | |
1196 | error = gfs2_glock_nq_atime(&i_gh); | |
1197 | if (error) { | |
1198 | gfs2_holder_uninit(&i_gh); | |
1199 | return error; | |
1200 | } | |
1201 | ||
1202 | if (!ip->i_di.di_size) { | |
1203 | gfs2_consist_inode(ip); | |
1204 | error = -EIO; | |
1205 | goto out; | |
1206 | } | |
1207 | ||
1208 | error = gfs2_meta_inode_buffer(ip, &dibh); | |
1209 | if (error) | |
1210 | goto out; | |
1211 | ||
1212 | x = ip->i_di.di_size + 1; | |
1213 | if (x > *len) { | |
1214 | *buf = kmalloc(x, GFP_KERNEL); | |
1215 | if (!*buf) { | |
1216 | error = -ENOMEM; | |
1217 | goto out_brelse; | |
1218 | } | |
1219 | } | |
1220 | ||
1221 | memcpy(*buf, dibh->b_data + sizeof(struct gfs2_dinode), x); | |
1222 | *len = x; | |
1223 | ||
feaa7bba | 1224 | out_brelse: |
b3b94faa | 1225 | brelse(dibh); |
feaa7bba | 1226 | out: |
b3b94faa | 1227 | gfs2_glock_dq_uninit(&i_gh); |
b3b94faa DT |
1228 | return error; |
1229 | } | |
1230 | ||
1231 | /** | |
1232 | * gfs2_glock_nq_atime - Acquire a hold on an inode's glock, and | |
1233 | * conditionally update the inode's atime | |
1234 | * @gh: the holder to acquire | |
1235 | * | |
1236 | * Tests atime (access time) for gfs2_read, gfs2_readdir and gfs2_mmap | |
1237 | * Update if the difference between the current time and the inode's current | |
1238 | * atime is greater than an interval specified at mount. | |
1239 | * | |
1240 | * Returns: errno | |
1241 | */ | |
1242 | ||
1243 | int gfs2_glock_nq_atime(struct gfs2_holder *gh) | |
1244 | { | |
1245 | struct gfs2_glock *gl = gh->gh_gl; | |
1246 | struct gfs2_sbd *sdp = gl->gl_sbd; | |
5c676f6d | 1247 | struct gfs2_inode *ip = gl->gl_object; |
4bd91ba1 | 1248 | s64 quantum = gfs2_tune_get(sdp, gt_atime_quantum); |
b3b94faa DT |
1249 | unsigned int state; |
1250 | int flags; | |
1251 | int error; | |
4bd91ba1 | 1252 | struct timespec tv = CURRENT_TIME; |
b3b94faa DT |
1253 | |
1254 | if (gfs2_assert_warn(sdp, gh->gh_flags & GL_ATIME) || | |
1255 | gfs2_assert_warn(sdp, !(gh->gh_flags & GL_ASYNC)) || | |
1256 | gfs2_assert_warn(sdp, gl->gl_ops == &gfs2_inode_glops)) | |
1257 | return -EINVAL; | |
1258 | ||
1259 | state = gh->gh_state; | |
1260 | flags = gh->gh_flags; | |
1261 | ||
1262 | error = gfs2_glock_nq(gh); | |
1263 | if (error) | |
1264 | return error; | |
1265 | ||
1266 | if (test_bit(SDF_NOATIME, &sdp->sd_flags) || | |
1267 | (sdp->sd_vfs->s_flags & MS_RDONLY)) | |
1268 | return 0; | |
1269 | ||
4bd91ba1 | 1270 | if (tv.tv_sec - ip->i_inode.i_atime.tv_sec >= quantum) { |
b3b94faa | 1271 | gfs2_glock_dq(gh); |
fd88de56 SW |
1272 | gfs2_holder_reinit(LM_ST_EXCLUSIVE, gh->gh_flags & ~LM_FLAG_ANY, |
1273 | gh); | |
b3b94faa DT |
1274 | error = gfs2_glock_nq(gh); |
1275 | if (error) | |
1276 | return error; | |
1277 | ||
1278 | /* Verify that atime hasn't been updated while we were | |
1279 | trying to get exclusive lock. */ | |
1280 | ||
4bd91ba1 SW |
1281 | tv = CURRENT_TIME; |
1282 | if (tv.tv_sec - ip->i_inode.i_atime.tv_sec >= quantum) { | |
b3b94faa | 1283 | struct buffer_head *dibh; |
48516ced | 1284 | struct gfs2_dinode *di; |
b3b94faa DT |
1285 | |
1286 | error = gfs2_trans_begin(sdp, RES_DINODE, 0); | |
1287 | if (error == -EROFS) | |
1288 | return 0; | |
1289 | if (error) | |
1290 | goto fail; | |
1291 | ||
1292 | error = gfs2_meta_inode_buffer(ip, &dibh); | |
1293 | if (error) | |
1294 | goto fail_end_trans; | |
1295 | ||
4bd91ba1 | 1296 | ip->i_inode.i_atime = tv; |
b3b94faa | 1297 | |
d4e9c4c3 | 1298 | gfs2_trans_add_bh(ip->i_gl, dibh, 1); |
48516ced | 1299 | di = (struct gfs2_dinode *)dibh->b_data; |
1a7b1eed | 1300 | di->di_atime = cpu_to_be64(ip->i_inode.i_atime.tv_sec); |
4bd91ba1 | 1301 | di->di_atime_nsec = cpu_to_be32(ip->i_inode.i_atime.tv_nsec); |
b3b94faa DT |
1302 | brelse(dibh); |
1303 | ||
1304 | gfs2_trans_end(sdp); | |
1305 | } | |
1306 | ||
1307 | /* If someone else has asked for the glock, | |
1308 | unlock and let them have it. Then reacquire | |
1309 | in the original state. */ | |
1310 | if (gfs2_glock_is_blocking(gl)) { | |
1311 | gfs2_glock_dq(gh); | |
1312 | gfs2_holder_reinit(state, flags, gh); | |
1313 | return gfs2_glock_nq(gh); | |
1314 | } | |
1315 | } | |
1316 | ||
1317 | return 0; | |
1318 | ||
feaa7bba | 1319 | fail_end_trans: |
b3b94faa | 1320 | gfs2_trans_end(sdp); |
feaa7bba | 1321 | fail: |
b3b94faa | 1322 | gfs2_glock_dq(gh); |
b3b94faa DT |
1323 | return error; |
1324 | } | |
1325 | ||
b3b94faa DT |
1326 | static int |
1327 | __gfs2_setattr_simple(struct gfs2_inode *ip, struct iattr *attr) | |
1328 | { | |
1329 | struct buffer_head *dibh; | |
1330 | int error; | |
1331 | ||
1332 | error = gfs2_meta_inode_buffer(ip, &dibh); | |
1333 | if (!error) { | |
feaa7bba SW |
1334 | error = inode_setattr(&ip->i_inode, attr); |
1335 | gfs2_assert_warn(GFS2_SB(&ip->i_inode), !error); | |
d4e9c4c3 | 1336 | gfs2_trans_add_bh(ip->i_gl, dibh, 1); |
539e5d6b | 1337 | gfs2_dinode_out(ip, dibh->b_data); |
b3b94faa DT |
1338 | brelse(dibh); |
1339 | } | |
1340 | return error; | |
1341 | } | |
1342 | ||
1343 | /** | |
1344 | * gfs2_setattr_simple - | |
1345 | * @ip: | |
1346 | * @attr: | |
1347 | * | |
1348 | * Called with a reference on the vnode. | |
1349 | * | |
1350 | * Returns: errno | |
1351 | */ | |
1352 | ||
1353 | int gfs2_setattr_simple(struct gfs2_inode *ip, struct iattr *attr) | |
1354 | { | |
1355 | int error; | |
1356 | ||
5c676f6d | 1357 | if (current->journal_info) |
b3b94faa DT |
1358 | return __gfs2_setattr_simple(ip, attr); |
1359 | ||
feaa7bba | 1360 | error = gfs2_trans_begin(GFS2_SB(&ip->i_inode), RES_DINODE, 0); |
b3b94faa DT |
1361 | if (error) |
1362 | return error; | |
1363 | ||
1364 | error = __gfs2_setattr_simple(ip, attr); | |
feaa7bba | 1365 | gfs2_trans_end(GFS2_SB(&ip->i_inode)); |
b3b94faa DT |
1366 | return error; |
1367 | } | |
1368 | ||
bb8d8a6f SW |
1369 | void gfs2_dinode_out(const struct gfs2_inode *ip, void *buf) |
1370 | { | |
1371 | const struct gfs2_dinode_host *di = &ip->i_di; | |
1372 | struct gfs2_dinode *str = buf; | |
1373 | ||
1374 | str->di_header.mh_magic = cpu_to_be32(GFS2_MAGIC); | |
1375 | str->di_header.mh_type = cpu_to_be32(GFS2_METATYPE_DI); | |
1376 | str->di_header.__pad0 = 0; | |
1377 | str->di_header.mh_format = cpu_to_be32(GFS2_FORMAT_DI); | |
1378 | str->di_header.__pad1 = 0; | |
1379 | str->di_num.no_addr = cpu_to_be64(ip->i_no_addr); | |
1380 | str->di_num.no_formal_ino = cpu_to_be64(ip->i_no_formal_ino); | |
1381 | str->di_mode = cpu_to_be32(ip->i_inode.i_mode); | |
1382 | str->di_uid = cpu_to_be32(ip->i_inode.i_uid); | |
1383 | str->di_gid = cpu_to_be32(ip->i_inode.i_gid); | |
1384 | str->di_nlink = cpu_to_be32(ip->i_inode.i_nlink); | |
1385 | str->di_size = cpu_to_be64(di->di_size); | |
1386 | str->di_blocks = cpu_to_be64(di->di_blocks); | |
1387 | str->di_atime = cpu_to_be64(ip->i_inode.i_atime.tv_sec); | |
1388 | str->di_mtime = cpu_to_be64(ip->i_inode.i_mtime.tv_sec); | |
1389 | str->di_ctime = cpu_to_be64(ip->i_inode.i_ctime.tv_sec); | |
1390 | ||
1391 | str->di_goal_meta = cpu_to_be64(di->di_goal_meta); | |
1392 | str->di_goal_data = cpu_to_be64(di->di_goal_data); | |
1393 | str->di_generation = cpu_to_be64(di->di_generation); | |
1394 | ||
1395 | str->di_flags = cpu_to_be32(di->di_flags); | |
1396 | str->di_height = cpu_to_be16(di->di_height); | |
1397 | str->di_payload_format = cpu_to_be32(S_ISDIR(ip->i_inode.i_mode) && | |
1398 | !(ip->i_di.di_flags & GFS2_DIF_EXHASH) ? | |
1399 | GFS2_FORMAT_DE : 0); | |
1400 | str->di_depth = cpu_to_be16(di->di_depth); | |
1401 | str->di_entries = cpu_to_be32(di->di_entries); | |
1402 | ||
1403 | str->di_eattr = cpu_to_be64(di->di_eattr); | |
4bd91ba1 SW |
1404 | str->di_atime_nsec = cpu_to_be32(ip->i_inode.i_atime.tv_nsec); |
1405 | str->di_mtime_nsec = cpu_to_be32(ip->i_inode.i_mtime.tv_nsec); | |
1406 | str->di_ctime_nsec = cpu_to_be32(ip->i_inode.i_ctime.tv_nsec); | |
bb8d8a6f SW |
1407 | } |
1408 | ||
1409 | void gfs2_dinode_print(const struct gfs2_inode *ip) | |
1410 | { | |
1411 | const struct gfs2_dinode_host *di = &ip->i_di; | |
1412 | ||
1413 | printk(KERN_INFO " no_formal_ino = %llu\n", | |
1414 | (unsigned long long)ip->i_no_formal_ino); | |
1415 | printk(KERN_INFO " no_addr = %llu\n", | |
1416 | (unsigned long long)ip->i_no_addr); | |
1417 | printk(KERN_INFO " di_size = %llu\n", (unsigned long long)di->di_size); | |
1418 | printk(KERN_INFO " di_blocks = %llu\n", | |
1419 | (unsigned long long)di->di_blocks); | |
1420 | printk(KERN_INFO " di_goal_meta = %llu\n", | |
1421 | (unsigned long long)di->di_goal_meta); | |
1422 | printk(KERN_INFO " di_goal_data = %llu\n", | |
1423 | (unsigned long long)di->di_goal_data); | |
1424 | printk(KERN_INFO " di_flags = 0x%.8X\n", di->di_flags); | |
1425 | printk(KERN_INFO " di_height = %u\n", di->di_height); | |
1426 | printk(KERN_INFO " di_depth = %u\n", di->di_depth); | |
1427 | printk(KERN_INFO " di_entries = %u\n", di->di_entries); | |
1428 | printk(KERN_INFO " di_eattr = %llu\n", | |
1429 | (unsigned long long)di->di_eattr); | |
1430 | } | |
1431 |