/kern_2.6.32/fs/gfs2/glops.c

http://omnia2droid.googlecode.com/ · C · 459 lines · 276 code · 66 blank · 117 comment · 44 complexity · 0a2cf69b1024eafecc993a22dfdea26c MD5 · raw file

  1. /*
  2. * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
  3. * Copyright (C) 2004-2008 Red Hat, Inc. All rights reserved.
  4. *
  5. * This copyrighted material is made available to anyone wishing to use,
  6. * modify, copy, or redistribute it subject to the terms and conditions
  7. * of the GNU General Public License version 2.
  8. */
  9. #include <linux/slab.h>
  10. #include <linux/spinlock.h>
  11. #include <linux/completion.h>
  12. #include <linux/buffer_head.h>
  13. #include <linux/gfs2_ondisk.h>
  14. #include <linux/bio.h>
  15. #include "gfs2.h"
  16. #include "incore.h"
  17. #include "bmap.h"
  18. #include "glock.h"
  19. #include "glops.h"
  20. #include "inode.h"
  21. #include "log.h"
  22. #include "meta_io.h"
  23. #include "recovery.h"
  24. #include "rgrp.h"
  25. #include "util.h"
  26. #include "trans.h"
  27. /**
  28. * ail_empty_gl - remove all buffers for a given lock from the AIL
  29. * @gl: the glock
  30. *
  31. * None of the buffers should be dirty, locked, or pinned.
  32. */
  33. static void gfs2_ail_empty_gl(struct gfs2_glock *gl)
  34. {
  35. struct gfs2_sbd *sdp = gl->gl_sbd;
  36. struct list_head *head = &gl->gl_ail_list;
  37. struct gfs2_bufdata *bd;
  38. struct buffer_head *bh;
  39. struct gfs2_trans tr;
  40. memset(&tr, 0, sizeof(tr));
  41. tr.tr_revokes = atomic_read(&gl->gl_ail_count);
  42. if (!tr.tr_revokes)
  43. return;
  44. /* A shortened, inline version of gfs2_trans_begin() */
  45. tr.tr_reserved = 1 + gfs2_struct2blk(sdp, tr.tr_revokes, sizeof(u64));
  46. tr.tr_ip = (unsigned long)__builtin_return_address(0);
  47. INIT_LIST_HEAD(&tr.tr_list_buf);
  48. gfs2_log_reserve(sdp, tr.tr_reserved);
  49. BUG_ON(current->journal_info);
  50. current->journal_info = &tr;
  51. gfs2_log_lock(sdp);
  52. while (!list_empty(head)) {
  53. bd = list_entry(head->next, struct gfs2_bufdata,
  54. bd_ail_gl_list);
  55. bh = bd->bd_bh;
  56. gfs2_remove_from_ail(bd);
  57. bd->bd_bh = NULL;
  58. bh->b_private = NULL;
  59. bd->bd_blkno = bh->b_blocknr;
  60. gfs2_assert_withdraw(sdp, !buffer_busy(bh));
  61. gfs2_trans_add_revoke(sdp, bd);
  62. }
  63. gfs2_assert_withdraw(sdp, !atomic_read(&gl->gl_ail_count));
  64. gfs2_log_unlock(sdp);
  65. gfs2_trans_end(sdp);
  66. gfs2_log_flush(sdp, NULL);
  67. }
  68. /**
  69. * rgrp_go_sync - sync out the metadata for this glock
  70. * @gl: the glock
  71. *
  72. * Called when demoting or unlocking an EX glock. We must flush
  73. * to disk all dirty buffers/pages relating to this glock, and must not
  74. * not return to caller to demote/unlock the glock until I/O is complete.
  75. */
  76. static void rgrp_go_sync(struct gfs2_glock *gl)
  77. {
  78. struct address_space *metamapping = gl->gl_aspace->i_mapping;
  79. int error;
  80. if (!test_and_clear_bit(GLF_DIRTY, &gl->gl_flags))
  81. return;
  82. BUG_ON(gl->gl_state != LM_ST_EXCLUSIVE);
  83. gfs2_log_flush(gl->gl_sbd, gl);
  84. filemap_fdatawrite(metamapping);
  85. error = filemap_fdatawait(metamapping);
  86. mapping_set_error(metamapping, error);
  87. gfs2_ail_empty_gl(gl);
  88. }
  89. /**
  90. * rgrp_go_inval - invalidate the metadata for this glock
  91. * @gl: the glock
  92. * @flags:
  93. *
  94. * We never used LM_ST_DEFERRED with resource groups, so that we
  95. * should always see the metadata flag set here.
  96. *
  97. */
  98. static void rgrp_go_inval(struct gfs2_glock *gl, int flags)
  99. {
  100. struct address_space *mapping = gl->gl_aspace->i_mapping;
  101. BUG_ON(!(flags & DIO_METADATA));
  102. gfs2_assert_withdraw(gl->gl_sbd, !atomic_read(&gl->gl_ail_count));
  103. truncate_inode_pages(mapping, 0);
  104. if (gl->gl_object) {
  105. struct gfs2_rgrpd *rgd = (struct gfs2_rgrpd *)gl->gl_object;
  106. rgd->rd_flags &= ~GFS2_RDF_UPTODATE;
  107. }
  108. }
  109. /**
  110. * inode_go_sync - Sync the dirty data and/or metadata for an inode glock
  111. * @gl: the glock protecting the inode
  112. *
  113. */
  114. static void inode_go_sync(struct gfs2_glock *gl)
  115. {
  116. struct gfs2_inode *ip = gl->gl_object;
  117. struct address_space *metamapping = gl->gl_aspace->i_mapping;
  118. int error;
  119. if (ip && !S_ISREG(ip->i_inode.i_mode))
  120. ip = NULL;
  121. if (ip && test_and_clear_bit(GIF_SW_PAGED, &ip->i_flags))
  122. unmap_shared_mapping_range(ip->i_inode.i_mapping, 0, 0);
  123. if (!test_and_clear_bit(GLF_DIRTY, &gl->gl_flags))
  124. return;
  125. BUG_ON(gl->gl_state != LM_ST_EXCLUSIVE);
  126. gfs2_log_flush(gl->gl_sbd, gl);
  127. filemap_fdatawrite(metamapping);
  128. if (ip) {
  129. struct address_space *mapping = ip->i_inode.i_mapping;
  130. filemap_fdatawrite(mapping);
  131. error = filemap_fdatawait(mapping);
  132. mapping_set_error(mapping, error);
  133. }
  134. error = filemap_fdatawait(metamapping);
  135. mapping_set_error(metamapping, error);
  136. gfs2_ail_empty_gl(gl);
  137. /*
  138. * Writeback of the data mapping may cause the dirty flag to be set
  139. * so we have to clear it again here.
  140. */
  141. smp_mb__before_clear_bit();
  142. clear_bit(GLF_DIRTY, &gl->gl_flags);
  143. }
  144. /**
  145. * inode_go_inval - prepare a inode glock to be released
  146. * @gl: the glock
  147. * @flags:
  148. *
  149. * Normally we invlidate everything, but if we are moving into
  150. * LM_ST_DEFERRED from LM_ST_SHARED or LM_ST_EXCLUSIVE then we
  151. * can keep hold of the metadata, since it won't have changed.
  152. *
  153. */
  154. static void inode_go_inval(struct gfs2_glock *gl, int flags)
  155. {
  156. struct gfs2_inode *ip = gl->gl_object;
  157. gfs2_assert_withdraw(gl->gl_sbd, !atomic_read(&gl->gl_ail_count));
  158. if (flags & DIO_METADATA) {
  159. struct address_space *mapping = gl->gl_aspace->i_mapping;
  160. truncate_inode_pages(mapping, 0);
  161. if (ip)
  162. set_bit(GIF_INVALID, &ip->i_flags);
  163. }
  164. if (ip == GFS2_I(gl->gl_sbd->sd_rindex))
  165. gl->gl_sbd->sd_rindex_uptodate = 0;
  166. if (ip && S_ISREG(ip->i_inode.i_mode))
  167. truncate_inode_pages(ip->i_inode.i_mapping, 0);
  168. }
  169. /**
  170. * inode_go_demote_ok - Check to see if it's ok to unlock an inode glock
  171. * @gl: the glock
  172. *
  173. * Returns: 1 if it's ok
  174. */
  175. static int inode_go_demote_ok(const struct gfs2_glock *gl)
  176. {
  177. struct gfs2_sbd *sdp = gl->gl_sbd;
  178. if (sdp->sd_jindex == gl->gl_object || sdp->sd_rindex == gl->gl_object)
  179. return 0;
  180. return 1;
  181. }
  182. /**
  183. * inode_go_lock - operation done after an inode lock is locked by a process
  184. * @gl: the glock
  185. * @flags:
  186. *
  187. * Returns: errno
  188. */
  189. static int inode_go_lock(struct gfs2_holder *gh)
  190. {
  191. struct gfs2_glock *gl = gh->gh_gl;
  192. struct gfs2_sbd *sdp = gl->gl_sbd;
  193. struct gfs2_inode *ip = gl->gl_object;
  194. int error = 0;
  195. if (!ip || (gh->gh_flags & GL_SKIP))
  196. return 0;
  197. if (test_bit(GIF_INVALID, &ip->i_flags)) {
  198. error = gfs2_inode_refresh(ip);
  199. if (error)
  200. return error;
  201. }
  202. if ((ip->i_diskflags & GFS2_DIF_TRUNC_IN_PROG) &&
  203. (gl->gl_state == LM_ST_EXCLUSIVE) &&
  204. (gh->gh_state == LM_ST_EXCLUSIVE)) {
  205. spin_lock(&sdp->sd_trunc_lock);
  206. if (list_empty(&ip->i_trunc_list))
  207. list_add(&sdp->sd_trunc_list, &ip->i_trunc_list);
  208. spin_unlock(&sdp->sd_trunc_lock);
  209. wake_up(&sdp->sd_quota_wait);
  210. return 1;
  211. }
  212. return error;
  213. }
  214. /**
  215. * inode_go_dump - print information about an inode
  216. * @seq: The iterator
  217. * @ip: the inode
  218. *
  219. * Returns: 0 on success, -ENOBUFS when we run out of space
  220. */
  221. static int inode_go_dump(struct seq_file *seq, const struct gfs2_glock *gl)
  222. {
  223. const struct gfs2_inode *ip = gl->gl_object;
  224. if (ip == NULL)
  225. return 0;
  226. gfs2_print_dbg(seq, " I: n:%llu/%llu t:%u f:0x%02lx d:0x%08x s:%llu/%llu\n",
  227. (unsigned long long)ip->i_no_formal_ino,
  228. (unsigned long long)ip->i_no_addr,
  229. IF2DT(ip->i_inode.i_mode), ip->i_flags,
  230. (unsigned int)ip->i_diskflags,
  231. (unsigned long long)ip->i_inode.i_size,
  232. (unsigned long long)ip->i_disksize);
  233. return 0;
  234. }
  235. /**
  236. * rgrp_go_demote_ok - Check to see if it's ok to unlock a RG's glock
  237. * @gl: the glock
  238. *
  239. * Returns: 1 if it's ok
  240. */
  241. static int rgrp_go_demote_ok(const struct gfs2_glock *gl)
  242. {
  243. return !gl->gl_aspace->i_mapping->nrpages;
  244. }
  245. /**
  246. * rgrp_go_lock - operation done after an rgrp lock is locked by
  247. * a first holder on this node.
  248. * @gl: the glock
  249. * @flags:
  250. *
  251. * Returns: errno
  252. */
  253. static int rgrp_go_lock(struct gfs2_holder *gh)
  254. {
  255. return gfs2_rgrp_bh_get(gh->gh_gl->gl_object);
  256. }
  257. /**
  258. * rgrp_go_unlock - operation done before an rgrp lock is unlocked by
  259. * a last holder on this node.
  260. * @gl: the glock
  261. * @flags:
  262. *
  263. */
  264. static void rgrp_go_unlock(struct gfs2_holder *gh)
  265. {
  266. gfs2_rgrp_bh_put(gh->gh_gl->gl_object);
  267. }
  268. /**
  269. * trans_go_sync - promote/demote the transaction glock
  270. * @gl: the glock
  271. * @state: the requested state
  272. * @flags:
  273. *
  274. */
  275. static void trans_go_sync(struct gfs2_glock *gl)
  276. {
  277. struct gfs2_sbd *sdp = gl->gl_sbd;
  278. if (gl->gl_state != LM_ST_UNLOCKED &&
  279. test_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags)) {
  280. flush_workqueue(gfs2_delete_workqueue);
  281. gfs2_meta_syncfs(sdp);
  282. gfs2_log_shutdown(sdp);
  283. }
  284. }
  285. /**
  286. * trans_go_xmote_bh - After promoting/demoting the transaction glock
  287. * @gl: the glock
  288. *
  289. */
  290. static int trans_go_xmote_bh(struct gfs2_glock *gl, struct gfs2_holder *gh)
  291. {
  292. struct gfs2_sbd *sdp = gl->gl_sbd;
  293. struct gfs2_inode *ip = GFS2_I(sdp->sd_jdesc->jd_inode);
  294. struct gfs2_glock *j_gl = ip->i_gl;
  295. struct gfs2_log_header_host head;
  296. int error;
  297. if (test_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags)) {
  298. j_gl->gl_ops->go_inval(j_gl, DIO_METADATA);
  299. error = gfs2_find_jhead(sdp->sd_jdesc, &head);
  300. if (error)
  301. gfs2_consist(sdp);
  302. if (!(head.lh_flags & GFS2_LOG_HEAD_UNMOUNT))
  303. gfs2_consist(sdp);
  304. /* Initialize some head of the log stuff */
  305. if (!test_bit(SDF_SHUTDOWN, &sdp->sd_flags)) {
  306. sdp->sd_log_sequence = head.lh_sequence + 1;
  307. gfs2_log_pointers_init(sdp, head.lh_blkno);
  308. }
  309. }
  310. return 0;
  311. }
  /**
   * trans_go_demote_ok - Check to see if it's ok to unlock the transaction glock
   * @gl: the glock (not examined)
   *
   * Returns: always 0, i.e. it is never ok
   */
  static int trans_go_demote_ok(const struct gfs2_glock *gl)
  {
  	return 0;
  }
  322. /**
  323. * iopen_go_callback - schedule the dcache entry for the inode to be deleted
  324. * @gl: the glock
  325. *
  326. * gl_spin lock is held while calling this
  327. */
  328. static void iopen_go_callback(struct gfs2_glock *gl)
  329. {
  330. struct gfs2_inode *ip = (struct gfs2_inode *)gl->gl_object;
  331. if (gl->gl_demote_state == LM_ST_UNLOCKED &&
  332. gl->gl_state == LM_ST_SHARED &&
  333. ip && test_bit(GIF_USER, &ip->i_flags)) {
  334. gfs2_glock_hold(gl);
  335. if (queue_work(gfs2_delete_workqueue, &gl->gl_delete) == 0)
  336. gfs2_glock_put_nolock(gl);
  337. }
  338. }
  339. const struct gfs2_glock_operations gfs2_meta_glops = {
  340. .go_type = LM_TYPE_META,
  341. };
  342. const struct gfs2_glock_operations gfs2_inode_glops = {
  343. .go_xmote_th = inode_go_sync,
  344. .go_inval = inode_go_inval,
  345. .go_demote_ok = inode_go_demote_ok,
  346. .go_lock = inode_go_lock,
  347. .go_dump = inode_go_dump,
  348. .go_type = LM_TYPE_INODE,
  349. .go_min_hold_time = HZ / 5,
  350. };
  351. const struct gfs2_glock_operations gfs2_rgrp_glops = {
  352. .go_xmote_th = rgrp_go_sync,
  353. .go_inval = rgrp_go_inval,
  354. .go_demote_ok = rgrp_go_demote_ok,
  355. .go_lock = rgrp_go_lock,
  356. .go_unlock = rgrp_go_unlock,
  357. .go_dump = gfs2_rgrp_dump,
  358. .go_type = LM_TYPE_RGRP,
  359. .go_min_hold_time = HZ / 5,
  360. };
  361. const struct gfs2_glock_operations gfs2_trans_glops = {
  362. .go_xmote_th = trans_go_sync,
  363. .go_xmote_bh = trans_go_xmote_bh,
  364. .go_demote_ok = trans_go_demote_ok,
  365. .go_type = LM_TYPE_NONDISK,
  366. };
  367. const struct gfs2_glock_operations gfs2_iopen_glops = {
  368. .go_type = LM_TYPE_IOPEN,
  369. .go_callback = iopen_go_callback,
  370. };
  371. const struct gfs2_glock_operations gfs2_flock_glops = {
  372. .go_type = LM_TYPE_FLOCK,
  373. };
  374. const struct gfs2_glock_operations gfs2_nondisk_glops = {
  375. .go_type = LM_TYPE_NONDISK,
  376. };
  377. const struct gfs2_glock_operations gfs2_quota_glops = {
  378. .go_type = LM_TYPE_QUOTA,
  379. };
  380. const struct gfs2_glock_operations gfs2_journal_glops = {
  381. .go_type = LM_TYPE_JOURNAL,
  382. };
  383. const struct gfs2_glock_operations *gfs2_glops_list[] = {
  384. [LM_TYPE_META] = &gfs2_meta_glops,
  385. [LM_TYPE_INODE] = &gfs2_inode_glops,
  386. [LM_TYPE_RGRP] = &gfs2_rgrp_glops,
  387. [LM_TYPE_NONDISK] = &gfs2_trans_glops,
  388. [LM_TYPE_IOPEN] = &gfs2_iopen_glops,
  389. [LM_TYPE_FLOCK] = &gfs2_flock_glops,
  390. [LM_TYPE_NONDISK] = &gfs2_nondisk_glops,
  391. [LM_TYPE_QUOTA] = &gfs2_quota_glops,
  392. [LM_TYPE_JOURNAL] = &gfs2_journal_glops,
  393. };