Commit | Line | Data |
---|---|---|
b3b94faa DT |
1 | /* |
2 | * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved. | |
cf45b752 | 3 | * Copyright (C) 2004-2008 Red Hat, Inc. All rights reserved. |
b3b94faa DT |
4 | * |
5 | * This copyrighted material is made available to anyone wishing to use, | |
6 | * modify, copy, or redistribute it subject to the terms and conditions | |
e9fc2aa0 | 7 | * of the GNU General Public License version 2. |
b3b94faa DT |
8 | */ |
9 | ||
b3b94faa DT |
10 | #include <linux/slab.h> |
11 | #include <linux/spinlock.h> | |
12 | #include <linux/completion.h> | |
13 | #include <linux/buffer_head.h> | |
5c676f6d | 14 | #include <linux/gfs2_ondisk.h> |
6802e340 | 15 | #include <linux/bio.h> |
b3b94faa DT |
16 | |
17 | #include "gfs2.h" | |
5c676f6d | 18 | #include "incore.h" |
b3b94faa DT |
19 | #include "bmap.h" |
20 | #include "glock.h" | |
21 | #include "glops.h" | |
22 | #include "inode.h" | |
23 | #include "log.h" | |
24 | #include "meta_io.h" | |
b3b94faa DT |
25 | #include "recovery.h" |
26 | #include "rgrp.h" | |
5c676f6d | 27 | #include "util.h" |
ddacfaf7 | 28 | #include "trans.h" |
b3b94faa | 29 | |
ddacfaf7 SW |
30 | /** |
31 | * ail_empty_gl - remove all buffers for a given lock from the AIL | |
32 | * @gl: the glock | |
33 | * | |
34 | * None of the buffers should be dirty, locked, or pinned. | |
35 | */ | |
36 | ||
37 | static void gfs2_ail_empty_gl(struct gfs2_glock *gl) | |
38 | { | |
39 | struct gfs2_sbd *sdp = gl->gl_sbd; | |
ddacfaf7 SW |
40 | struct list_head *head = &gl->gl_ail_list; |
41 | struct gfs2_bufdata *bd; | |
42 | struct buffer_head *bh; | |
d8348de0 | 43 | struct gfs2_trans tr; |
ddacfaf7 | 44 | |
d8348de0 SW |
45 | memset(&tr, 0, sizeof(tr)); |
46 | tr.tr_revokes = atomic_read(&gl->gl_ail_count); | |
ddacfaf7 | 47 | |
d8348de0 | 48 | if (!tr.tr_revokes) |
ddacfaf7 SW |
49 | return; |
50 | ||
d8348de0 SW |
51 | /* A shortened, inline version of gfs2_trans_begin() */ |
52 | tr.tr_reserved = 1 + gfs2_struct2blk(sdp, tr.tr_revokes, sizeof(u64)); | |
53 | tr.tr_ip = (unsigned long)__builtin_return_address(0); | |
54 | INIT_LIST_HEAD(&tr.tr_list_buf); | |
55 | gfs2_log_reserve(sdp, tr.tr_reserved); | |
56 | BUG_ON(current->journal_info); | |
57 | current->journal_info = &tr; | |
58 | ||
ddacfaf7 SW |
59 | gfs2_log_lock(sdp); |
60 | while (!list_empty(head)) { | |
61 | bd = list_entry(head->next, struct gfs2_bufdata, | |
62 | bd_ail_gl_list); | |
63 | bh = bd->bd_bh; | |
f91a0d3e | 64 | gfs2_remove_from_ail(bd); |
1ad38c43 SW |
65 | bd->bd_bh = NULL; |
66 | bh->b_private = NULL; | |
67 | bd->bd_blkno = bh->b_blocknr; | |
68 | gfs2_assert_withdraw(sdp, !buffer_busy(bh)); | |
69 | gfs2_trans_add_revoke(sdp, bd); | |
ddacfaf7 SW |
70 | } |
71 | gfs2_assert_withdraw(sdp, !atomic_read(&gl->gl_ail_count)); | |
72 | gfs2_log_unlock(sdp); | |
73 | ||
74 | gfs2_trans_end(sdp); | |
75 | gfs2_log_flush(sdp, NULL); | |
76 | } | |
ba7f7290 SW |
77 | |
78 | /** | |
6bac243f | 79 | * rgrp_go_sync - sync out the metadata for this glock |
b3b94faa | 80 | * @gl: the glock |
b3b94faa DT |
81 | * |
82 | * Called when demoting or unlocking an EX glock. We must flush | |
83 | * to disk all dirty buffers/pages relating to this glock, and must not | |
84 | * not return to caller to demote/unlock the glock until I/O is complete. | |
85 | */ | |
86 | ||
6bac243f | 87 | static void rgrp_go_sync(struct gfs2_glock *gl) |
b3b94faa | 88 | { |
6bac243f SW |
89 | struct address_space *metamapping = gl->gl_aspace->i_mapping; |
90 | int error; | |
91 | ||
92 | if (!test_and_clear_bit(GLF_DIRTY, &gl->gl_flags)) | |
b5d32bea | 93 | return; |
6bac243f | 94 | BUG_ON(gl->gl_state != LM_ST_EXCLUSIVE); |
b5d32bea | 95 | |
6bac243f SW |
96 | gfs2_log_flush(gl->gl_sbd, gl); |
97 | filemap_fdatawrite(metamapping); | |
98 | error = filemap_fdatawait(metamapping); | |
99 | mapping_set_error(metamapping, error); | |
100 | gfs2_ail_empty_gl(gl); | |
b3b94faa DT |
101 | } |
102 | ||
103 | /** | |
6bac243f | 104 | * rgrp_go_inval - invalidate the metadata for this glock |
b3b94faa DT |
105 | * @gl: the glock |
106 | * @flags: | |
107 | * | |
6bac243f SW |
108 | * We never used LM_ST_DEFERRED with resource groups, so that we |
109 | * should always see the metadata flag set here. | |
110 | * | |
b3b94faa DT |
111 | */ |
112 | ||
6bac243f | 113 | static void rgrp_go_inval(struct gfs2_glock *gl, int flags) |
b3b94faa | 114 | { |
6bac243f | 115 | struct address_space *mapping = gl->gl_aspace->i_mapping; |
b3b94faa | 116 | |
6bac243f SW |
117 | BUG_ON(!(flags & DIO_METADATA)); |
118 | gfs2_assert_withdraw(gl->gl_sbd, !atomic_read(&gl->gl_ail_count)); | |
119 | truncate_inode_pages(mapping, 0); | |
cf45b752 | 120 | |
6bac243f SW |
121 | if (gl->gl_object) { |
122 | struct gfs2_rgrpd *rgd = (struct gfs2_rgrpd *)gl->gl_object; | |
cf45b752 BP |
123 | rgd->rd_flags &= ~GFS2_RDF_UPTODATE; |
124 | } | |
b3b94faa DT |
125 | } |
126 | ||
b5d32bea SW |
127 | /** |
128 | * inode_go_sync - Sync the dirty data and/or metadata for an inode glock | |
129 | * @gl: the glock protecting the inode | |
130 | * | |
131 | */ | |
132 | ||
133 | static void inode_go_sync(struct gfs2_glock *gl) | |
134 | { | |
135 | struct gfs2_inode *ip = gl->gl_object; | |
3042a2cc SW |
136 | struct address_space *metamapping = gl->gl_aspace->i_mapping; |
137 | int error; | |
138 | ||
b5d32bea SW |
139 | if (ip && !S_ISREG(ip->i_inode.i_mode)) |
140 | ip = NULL; | |
6bac243f SW |
141 | if (ip && test_and_clear_bit(GIF_SW_PAGED, &ip->i_flags)) |
142 | unmap_shared_mapping_range(ip->i_inode.i_mapping, 0, 0); | |
143 | if (!test_and_clear_bit(GLF_DIRTY, &gl->gl_flags)) | |
144 | return; | |
b5d32bea | 145 | |
6bac243f SW |
146 | BUG_ON(gl->gl_state != LM_ST_EXCLUSIVE); |
147 | ||
148 | gfs2_log_flush(gl->gl_sbd, gl); | |
149 | filemap_fdatawrite(metamapping); | |
150 | if (ip) { | |
151 | struct address_space *mapping = ip->i_inode.i_mapping; | |
152 | filemap_fdatawrite(mapping); | |
153 | error = filemap_fdatawait(mapping); | |
154 | mapping_set_error(mapping, error); | |
b5d32bea | 155 | } |
6bac243f SW |
156 | error = filemap_fdatawait(metamapping); |
157 | mapping_set_error(metamapping, error); | |
158 | gfs2_ail_empty_gl(gl); | |
52fcd11c SW |
159 | /* |
160 | * Writeback of the data mapping may cause the dirty flag to be set | |
161 | * so we have to clear it again here. | |
162 | */ | |
163 | smp_mb__before_clear_bit(); | |
164 | clear_bit(GLF_DIRTY, &gl->gl_flags); | |
b5d32bea SW |
165 | } |
166 | ||
b3b94faa DT |
167 | /** |
168 | * inode_go_inval - prepare a inode glock to be released | |
169 | * @gl: the glock | |
170 | * @flags: | |
6bac243f SW |
171 | * |
172 | * Normally we invlidate everything, but if we are moving into | |
173 | * LM_ST_DEFERRED from LM_ST_SHARED or LM_ST_EXCLUSIVE then we | |
174 | * can keep hold of the metadata, since it won't have changed. | |
b3b94faa DT |
175 | * |
176 | */ | |
177 | ||
178 | static void inode_go_inval(struct gfs2_glock *gl, int flags) | |
179 | { | |
b004157a | 180 | struct gfs2_inode *ip = gl->gl_object; |
b3b94faa | 181 | |
6bac243f SW |
182 | gfs2_assert_withdraw(gl->gl_sbd, !atomic_read(&gl->gl_ail_count)); |
183 | ||
184 | if (flags & DIO_METADATA) { | |
185 | struct address_space *mapping = gl->gl_aspace->i_mapping; | |
186 | truncate_inode_pages(mapping, 0); | |
b004157a SW |
187 | if (ip) |
188 | set_bit(GIF_INVALID, &ip->i_flags); | |
189 | } | |
190 | ||
6bac243f SW |
191 | if (ip == GFS2_I(gl->gl_sbd->sd_rindex)) |
192 | gl->gl_sbd->sd_rindex_uptodate = 0; | |
3cc3f710 | 193 | if (ip && S_ISREG(ip->i_inode.i_mode)) |
b004157a | 194 | truncate_inode_pages(ip->i_inode.i_mapping, 0); |
b3b94faa DT |
195 | } |
196 | ||
197 | /** | |
198 | * inode_go_demote_ok - Check to see if it's ok to unlock an inode glock | |
199 | * @gl: the glock | |
200 | * | |
201 | * Returns: 1 if it's ok | |
202 | */ | |
203 | ||
97cc1025 | 204 | static int inode_go_demote_ok(const struct gfs2_glock *gl) |
b3b94faa DT |
205 | { |
206 | struct gfs2_sbd *sdp = gl->gl_sbd; | |
97cc1025 SW |
207 | if (sdp->sd_jindex == gl->gl_object || sdp->sd_rindex == gl->gl_object) |
208 | return 0; | |
209 | return 1; | |
b3b94faa DT |
210 | } |
211 | ||
212 | /** | |
213 | * inode_go_lock - operation done after an inode lock is locked by a process | |
214 | * @gl: the glock | |
215 | * @flags: | |
216 | * | |
217 | * Returns: errno | |
218 | */ | |
219 | ||
220 | static int inode_go_lock(struct gfs2_holder *gh) | |
221 | { | |
222 | struct gfs2_glock *gl = gh->gh_gl; | |
813e0c46 | 223 | struct gfs2_sbd *sdp = gl->gl_sbd; |
5c676f6d | 224 | struct gfs2_inode *ip = gl->gl_object; |
b3b94faa DT |
225 | int error = 0; |
226 | ||
091806ed | 227 | if (!ip || (gh->gh_flags & GL_SKIP)) |
b3b94faa DT |
228 | return 0; |
229 | ||
bfded27b | 230 | if (test_bit(GIF_INVALID, &ip->i_flags)) { |
b3b94faa DT |
231 | error = gfs2_inode_refresh(ip); |
232 | if (error) | |
233 | return error; | |
b3b94faa DT |
234 | } |
235 | ||
383f01fb | 236 | if ((ip->i_diskflags & GFS2_DIF_TRUNC_IN_PROG) && |
b3b94faa | 237 | (gl->gl_state == LM_ST_EXCLUSIVE) && |
813e0c46 SW |
238 | (gh->gh_state == LM_ST_EXCLUSIVE)) { |
239 | spin_lock(&sdp->sd_trunc_lock); | |
240 | if (list_empty(&ip->i_trunc_list)) | |
241 | list_add(&sdp->sd_trunc_list, &ip->i_trunc_list); | |
242 | spin_unlock(&sdp->sd_trunc_lock); | |
243 | wake_up(&sdp->sd_quota_wait); | |
244 | return 1; | |
245 | } | |
b3b94faa DT |
246 | |
247 | return error; | |
248 | } | |
249 | ||
6802e340 SW |
250 | /** |
251 | * inode_go_dump - print information about an inode | |
252 | * @seq: The iterator | |
253 | * @ip: the inode | |
254 | * | |
255 | * Returns: 0 on success, -ENOBUFS when we run out of space | |
256 | */ | |
257 | ||
258 | static int inode_go_dump(struct seq_file *seq, const struct gfs2_glock *gl) | |
259 | { | |
260 | const struct gfs2_inode *ip = gl->gl_object; | |
261 | if (ip == NULL) | |
262 | return 0; | |
fa75cedc | 263 | gfs2_print_dbg(seq, " I: n:%llu/%llu t:%u f:0x%02lx d:0x%08x s:%llu/%llu\n", |
6802e340 SW |
264 | (unsigned long long)ip->i_no_formal_ino, |
265 | (unsigned long long)ip->i_no_addr, | |
fa75cedc SW |
266 | IF2DT(ip->i_inode.i_mode), ip->i_flags, |
267 | (unsigned int)ip->i_diskflags, | |
268 | (unsigned long long)ip->i_inode.i_size, | |
269 | (unsigned long long)ip->i_disksize); | |
6802e340 SW |
270 | return 0; |
271 | } | |
272 | ||
b3b94faa DT |
273 | /** |
274 | * rgrp_go_demote_ok - Check to see if it's ok to unlock a RG's glock | |
275 | * @gl: the glock | |
276 | * | |
277 | * Returns: 1 if it's ok | |
278 | */ | |
279 | ||
97cc1025 | 280 | static int rgrp_go_demote_ok(const struct gfs2_glock *gl) |
b3b94faa DT |
281 | { |
282 | return !gl->gl_aspace->i_mapping->nrpages; | |
283 | } | |
284 | ||
285 | /** | |
286 | * rgrp_go_lock - operation done after an rgrp lock is locked by | |
287 | * a first holder on this node. | |
288 | * @gl: the glock | |
289 | * @flags: | |
290 | * | |
291 | * Returns: errno | |
292 | */ | |
293 | ||
294 | static int rgrp_go_lock(struct gfs2_holder *gh) | |
295 | { | |
5c676f6d | 296 | return gfs2_rgrp_bh_get(gh->gh_gl->gl_object); |
b3b94faa DT |
297 | } |
298 | ||
299 | /** | |
300 | * rgrp_go_unlock - operation done before an rgrp lock is unlocked by | |
301 | * a last holder on this node. | |
302 | * @gl: the glock | |
303 | * @flags: | |
304 | * | |
305 | */ | |
306 | ||
307 | static void rgrp_go_unlock(struct gfs2_holder *gh) | |
308 | { | |
5c676f6d | 309 | gfs2_rgrp_bh_put(gh->gh_gl->gl_object); |
b3b94faa DT |
310 | } |
311 | ||
312 | /** | |
3042a2cc | 313 | * trans_go_sync - promote/demote the transaction glock |
b3b94faa DT |
314 | * @gl: the glock |
315 | * @state: the requested state | |
316 | * @flags: | |
317 | * | |
318 | */ | |
319 | ||
3042a2cc | 320 | static void trans_go_sync(struct gfs2_glock *gl) |
b3b94faa DT |
321 | { |
322 | struct gfs2_sbd *sdp = gl->gl_sbd; | |
323 | ||
324 | if (gl->gl_state != LM_ST_UNLOCKED && | |
325 | test_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags)) { | |
b94a170e | 326 | flush_workqueue(gfs2_delete_workqueue); |
b3b94faa DT |
327 | gfs2_meta_syncfs(sdp); |
328 | gfs2_log_shutdown(sdp); | |
329 | } | |
b3b94faa DT |
330 | } |
331 | ||
332 | /** | |
333 | * trans_go_xmote_bh - After promoting/demoting the transaction glock | |
334 | * @gl: the glock | |
335 | * | |
336 | */ | |
337 | ||
6802e340 | 338 | static int trans_go_xmote_bh(struct gfs2_glock *gl, struct gfs2_holder *gh) |
b3b94faa DT |
339 | { |
340 | struct gfs2_sbd *sdp = gl->gl_sbd; | |
feaa7bba | 341 | struct gfs2_inode *ip = GFS2_I(sdp->sd_jdesc->jd_inode); |
5c676f6d | 342 | struct gfs2_glock *j_gl = ip->i_gl; |
55167622 | 343 | struct gfs2_log_header_host head; |
b3b94faa DT |
344 | int error; |
345 | ||
6802e340 | 346 | if (test_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags)) { |
1a14d3a6 | 347 | j_gl->gl_ops->go_inval(j_gl, DIO_METADATA); |
b3b94faa DT |
348 | |
349 | error = gfs2_find_jhead(sdp->sd_jdesc, &head); | |
350 | if (error) | |
351 | gfs2_consist(sdp); | |
352 | if (!(head.lh_flags & GFS2_LOG_HEAD_UNMOUNT)) | |
353 | gfs2_consist(sdp); | |
354 | ||
355 | /* Initialize some head of the log stuff */ | |
356 | if (!test_bit(SDF_SHUTDOWN, &sdp->sd_flags)) { | |
357 | sdp->sd_log_sequence = head.lh_sequence + 1; | |
358 | gfs2_log_pointers_init(sdp, head.lh_blkno); | |
359 | } | |
360 | } | |
6802e340 | 361 | return 0; |
b3b94faa DT |
362 | } |
363 | ||
97cc1025 SW |
364 | /** |
365 | * trans_go_demote_ok | |
366 | * @gl: the glock | |
367 | * | |
368 | * Always returns 0 | |
369 | */ | |
370 | ||
371 | static int trans_go_demote_ok(const struct gfs2_glock *gl) | |
372 | { | |
373 | return 0; | |
374 | } | |
375 | ||
b94a170e BM |
376 | /** |
377 | * iopen_go_callback - schedule the dcache entry for the inode to be deleted | |
378 | * @gl: the glock | |
379 | * | |
380 | * gl_spin lock is held while calling this | |
381 | */ | |
382 | static void iopen_go_callback(struct gfs2_glock *gl) | |
383 | { | |
384 | struct gfs2_inode *ip = (struct gfs2_inode *)gl->gl_object; | |
385 | ||
386 | if (gl->gl_demote_state == LM_ST_UNLOCKED && | |
387 | gl->gl_state == LM_ST_SHARED && | |
388 | ip && test_bit(GIF_USER, &ip->i_flags)) { | |
389 | gfs2_glock_hold(gl); | |
390 | if (queue_work(gfs2_delete_workqueue, &gl->gl_delete) == 0) | |
391 | gfs2_glock_put_nolock(gl); | |
392 | } | |
393 | } | |
394 | ||
8fb4b536 | 395 | const struct gfs2_glock_operations gfs2_meta_glops = { |
ea67eedb | 396 | .go_type = LM_TYPE_META, |
b3b94faa DT |
397 | }; |
398 | ||
8fb4b536 | 399 | const struct gfs2_glock_operations gfs2_inode_glops = { |
3042a2cc | 400 | .go_xmote_th = inode_go_sync, |
b3b94faa DT |
401 | .go_inval = inode_go_inval, |
402 | .go_demote_ok = inode_go_demote_ok, | |
403 | .go_lock = inode_go_lock, | |
6802e340 | 404 | .go_dump = inode_go_dump, |
ea67eedb | 405 | .go_type = LM_TYPE_INODE, |
6802e340 | 406 | .go_min_hold_time = HZ / 5, |
b3b94faa DT |
407 | }; |
408 | ||
8fb4b536 | 409 | const struct gfs2_glock_operations gfs2_rgrp_glops = { |
6bac243f SW |
410 | .go_xmote_th = rgrp_go_sync, |
411 | .go_inval = rgrp_go_inval, | |
b3b94faa DT |
412 | .go_demote_ok = rgrp_go_demote_ok, |
413 | .go_lock = rgrp_go_lock, | |
414 | .go_unlock = rgrp_go_unlock, | |
09010978 | 415 | .go_dump = gfs2_rgrp_dump, |
ea67eedb | 416 | .go_type = LM_TYPE_RGRP, |
6802e340 | 417 | .go_min_hold_time = HZ / 5, |
b3b94faa DT |
418 | }; |
419 | ||
8fb4b536 | 420 | const struct gfs2_glock_operations gfs2_trans_glops = { |
3042a2cc | 421 | .go_xmote_th = trans_go_sync, |
b3b94faa | 422 | .go_xmote_bh = trans_go_xmote_bh, |
97cc1025 | 423 | .go_demote_ok = trans_go_demote_ok, |
ea67eedb | 424 | .go_type = LM_TYPE_NONDISK, |
b3b94faa DT |
425 | }; |
426 | ||
8fb4b536 | 427 | const struct gfs2_glock_operations gfs2_iopen_glops = { |
ea67eedb | 428 | .go_type = LM_TYPE_IOPEN, |
b94a170e | 429 | .go_callback = iopen_go_callback, |
b3b94faa DT |
430 | }; |
431 | ||
8fb4b536 | 432 | const struct gfs2_glock_operations gfs2_flock_glops = { |
ea67eedb | 433 | .go_type = LM_TYPE_FLOCK, |
b3b94faa DT |
434 | }; |
435 | ||
8fb4b536 | 436 | const struct gfs2_glock_operations gfs2_nondisk_glops = { |
ea67eedb | 437 | .go_type = LM_TYPE_NONDISK, |
b3b94faa DT |
438 | }; |
439 | ||
8fb4b536 | 440 | const struct gfs2_glock_operations gfs2_quota_glops = { |
ea67eedb | 441 | .go_type = LM_TYPE_QUOTA, |
b3b94faa DT |
442 | }; |
443 | ||
8fb4b536 | 444 | const struct gfs2_glock_operations gfs2_journal_glops = { |
ea67eedb | 445 | .go_type = LM_TYPE_JOURNAL, |
b3b94faa DT |
446 | }; |
447 | ||
64d576ba SW |
448 | const struct gfs2_glock_operations *gfs2_glops_list[] = { |
449 | [LM_TYPE_META] = &gfs2_meta_glops, | |
450 | [LM_TYPE_INODE] = &gfs2_inode_glops, | |
451 | [LM_TYPE_RGRP] = &gfs2_rgrp_glops, | |
452 | [LM_TYPE_NONDISK] = &gfs2_trans_glops, | |
453 | [LM_TYPE_IOPEN] = &gfs2_iopen_glops, | |
454 | [LM_TYPE_FLOCK] = &gfs2_flock_glops, | |
455 | [LM_TYPE_NONDISK] = &gfs2_nondisk_glops, | |
456 | [LM_TYPE_QUOTA] = &gfs2_quota_glops, | |
457 | [LM_TYPE_JOURNAL] = &gfs2_journal_glops, | |
458 | }; | |
459 |