the_nilfs.h 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397
  1. /*
  2. * the_nilfs.h - the_nilfs shared structure.
  3. *
  4. * Copyright (C) 2005-2008 Nippon Telegraph and Telephone Corporation.
  5. *
  6. * This program is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU General Public License as published by
  8. * the Free Software Foundation; either version 2 of the License, or
  9. * (at your option) any later version.
  10. *
  11. * This program is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  14. * GNU General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU General Public License
  17. * along with this program; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
  19. *
  20. * Written by Ryusuke Konishi <ryusuke@osrg.net>
  21. *
  22. */
  23. #ifndef _THE_NILFS_H
  24. #define _THE_NILFS_H
  25. #include <linux/types.h>
  26. #include <linux/buffer_head.h>
  27. #include <linux/rbtree.h>
  28. #include <linux/fs.h>
  29. #include <linux/blkdev.h>
  30. #include <linux/backing-dev.h>
  31. #include <linux/slab.h>
/*
 * Forward declarations: this header only stores pointers to these
 * structures (ns_writer and ns_dev_subgroups in struct the_nilfs), so
 * their full definitions are not needed here.
 */
struct nilfs_sc_info;
struct nilfs_sysfs_dev_subgroups;
  34. /* the_nilfs struct */
  35. enum {
  36. THE_NILFS_INIT = 0, /* Information from super_block is set */
  37. THE_NILFS_DISCONTINUED, /* 'next' pointer chain has broken */
  38. THE_NILFS_GC_RUNNING, /* gc process is running */
  39. THE_NILFS_SB_DIRTY, /* super block is dirty */
  40. };
  41. /**
  42. * struct the_nilfs - struct to supervise multiple nilfs mount points
  43. * @ns_flags: flags
  44. * @ns_flushed_device: flag indicating if all volatile data was flushed
  45. * @ns_bdev: block device
  46. * @ns_sem: semaphore for shared states
  47. * @ns_snapshot_mount_mutex: mutex to protect snapshot mounts
  48. * @ns_sbh: buffer heads of on-disk super blocks
  49. * @ns_sbp: pointers to super block data
  50. * @ns_sbwtime: previous write time of super block
  51. * @ns_sbwcount: write count of super block
  52. * @ns_sbsize: size of valid data in super block
  53. * @ns_mount_state: file system state
  54. * @ns_sb_update_freq: interval of periodical update of superblocks (in seconds)
  55. * @ns_seg_seq: segment sequence counter
  56. * @ns_segnum: index number of the latest full segment.
  57. * @ns_nextnum: index number of the full segment index to be used next
  58. * @ns_pseg_offset: offset of next partial segment in the current full segment
  59. * @ns_cno: next checkpoint number
  60. * @ns_ctime: write time of the last segment
  61. * @ns_nongc_ctime: write time of the last segment not for cleaner operation
  62. * @ns_ndirtyblks: Number of dirty data blocks
  63. * @ns_last_segment_lock: lock protecting fields for the latest segment
  64. * @ns_last_pseg: start block number of the latest segment
  65. * @ns_last_seq: sequence value of the latest segment
  66. * @ns_last_cno: checkpoint number of the latest segment
  67. * @ns_prot_seq: least sequence number of segments which must not be reclaimed
  68. * @ns_prev_seq: base sequence number used to decide if advance log cursor
  69. * @ns_writer: log writer
  70. * @ns_segctor_sem: semaphore protecting log write
  71. * @ns_dat: DAT file inode
  72. * @ns_cpfile: checkpoint file inode
  73. * @ns_sufile: segusage file inode
  74. * @ns_cptree: rb-tree of all mounted checkpoints (nilfs_root)
  75. * @ns_cptree_lock: lock protecting @ns_cptree
  76. * @ns_dirty_files: list of dirty files
  77. * @ns_inode_lock: lock protecting @ns_dirty_files
  78. * @ns_gc_inodes: dummy inodes to keep live blocks
  79. * @ns_next_generation: next generation number for inodes
  80. * @ns_next_gen_lock: lock protecting @ns_next_generation
  81. * @ns_mount_opt: mount options
  82. * @ns_resuid: uid for reserved blocks
  83. * @ns_resgid: gid for reserved blocks
  84. * @ns_interval: checkpoint creation interval
  85. * @ns_watermark: watermark for the number of dirty buffers
  86. * @ns_blocksize_bits: bit length of block size
  87. * @ns_blocksize: block size
  88. * @ns_nsegments: number of segments in filesystem
  89. * @ns_blocks_per_segment: number of blocks per segment
  90. * @ns_r_segments_percentage: reserved segments percentage
  91. * @ns_nrsvsegs: number of reserved segments
  92. * @ns_first_data_block: block number of first data block
  93. * @ns_inode_size: size of on-disk inode
  94. * @ns_first_ino: first not-special inode number
  95. * @ns_crc_seed: seed value of CRC32 calculation
  96. * @ns_dev_kobj: /sys/fs/<nilfs>/<device>
  97. * @ns_dev_kobj_unregister: completion state
  98. * @ns_dev_subgroups: <device> subgroups pointer
  99. */
  100. struct the_nilfs {
  101. unsigned long ns_flags;
  102. int ns_flushed_device;
  103. struct block_device *ns_bdev;
  104. struct rw_semaphore ns_sem;
  105. struct mutex ns_snapshot_mount_mutex;
  106. /*
  107. * used for
  108. * - loading the latest checkpoint exclusively.
  109. * - allocating a new full segment.
  110. */
  111. struct buffer_head *ns_sbh[2];
  112. struct nilfs_super_block *ns_sbp[2];
  113. time_t ns_sbwtime;
  114. unsigned ns_sbwcount;
  115. unsigned ns_sbsize;
  116. unsigned ns_mount_state;
  117. unsigned ns_sb_update_freq;
  118. /*
  119. * Following fields are dedicated to a writable FS-instance.
  120. * Except for the period seeking checkpoint, code outside the segment
  121. * constructor must lock a segment semaphore while accessing these
  122. * fields.
  123. * The writable FS-instance is sole during a lifetime of the_nilfs.
  124. */
  125. u64 ns_seg_seq;
  126. __u64 ns_segnum;
  127. __u64 ns_nextnum;
  128. unsigned long ns_pseg_offset;
  129. __u64 ns_cno;
  130. time_t ns_ctime;
  131. time_t ns_nongc_ctime;
  132. atomic_t ns_ndirtyblks;
  133. /*
  134. * The following fields hold information on the latest partial segment
  135. * written to disk with a super root. These fields are protected by
  136. * ns_last_segment_lock.
  137. */
  138. spinlock_t ns_last_segment_lock;
  139. sector_t ns_last_pseg;
  140. u64 ns_last_seq;
  141. __u64 ns_last_cno;
  142. u64 ns_prot_seq;
  143. u64 ns_prev_seq;
  144. struct nilfs_sc_info *ns_writer;
  145. struct rw_semaphore ns_segctor_sem;
  146. /*
  147. * Following fields are lock free except for the period before
  148. * the_nilfs is initialized.
  149. */
  150. struct inode *ns_dat;
  151. struct inode *ns_cpfile;
  152. struct inode *ns_sufile;
  153. /* Checkpoint tree */
  154. struct rb_root ns_cptree;
  155. spinlock_t ns_cptree_lock;
  156. /* Dirty inode list */
  157. struct list_head ns_dirty_files;
  158. spinlock_t ns_inode_lock;
  159. /* GC inode list */
  160. struct list_head ns_gc_inodes;
  161. /* Inode allocator */
  162. u32 ns_next_generation;
  163. spinlock_t ns_next_gen_lock;
  164. /* Mount options */
  165. unsigned long ns_mount_opt;
  166. uid_t ns_resuid;
  167. gid_t ns_resgid;
  168. unsigned long ns_interval;
  169. unsigned long ns_watermark;
  170. /* Disk layout information (static) */
  171. unsigned int ns_blocksize_bits;
  172. unsigned int ns_blocksize;
  173. unsigned long ns_nsegments;
  174. unsigned long ns_blocks_per_segment;
  175. unsigned long ns_r_segments_percentage;
  176. unsigned long ns_nrsvsegs;
  177. unsigned long ns_first_data_block;
  178. int ns_inode_size;
  179. int ns_first_ino;
  180. u32 ns_crc_seed;
  181. /* /sys/fs/<nilfs>/<device> */
  182. struct kobject ns_dev_kobj;
  183. struct completion ns_dev_kobj_unregister;
  184. struct nilfs_sysfs_dev_subgroups *ns_dev_subgroups;
  185. };
  186. #define THE_NILFS_FNS(bit, name) \
  187. static inline void set_nilfs_##name(struct the_nilfs *nilfs) \
  188. { \
  189. set_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
  190. } \
  191. static inline void clear_nilfs_##name(struct the_nilfs *nilfs) \
  192. { \
  193. clear_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
  194. } \
  195. static inline int nilfs_##name(struct the_nilfs *nilfs) \
  196. { \
  197. return test_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
  198. }
  199. THE_NILFS_FNS(INIT, init)
  200. THE_NILFS_FNS(DISCONTINUED, discontinued)
  201. THE_NILFS_FNS(GC_RUNNING, gc_running)
  202. THE_NILFS_FNS(SB_DIRTY, sb_dirty)
  203. /*
  204. * Mount option operations
  205. */
  206. #define nilfs_clear_opt(nilfs, opt) \
  207. do { (nilfs)->ns_mount_opt &= ~NILFS_MOUNT_##opt; } while (0)
  208. #define nilfs_set_opt(nilfs, opt) \
  209. do { (nilfs)->ns_mount_opt |= NILFS_MOUNT_##opt; } while (0)
  210. #define nilfs_test_opt(nilfs, opt) ((nilfs)->ns_mount_opt & NILFS_MOUNT_##opt)
  211. #define nilfs_write_opt(nilfs, mask, opt) \
  212. do { (nilfs)->ns_mount_opt = \
  213. (((nilfs)->ns_mount_opt & ~NILFS_MOUNT_##mask) | \
  214. NILFS_MOUNT_##opt); \
  215. } while (0)
/**
 * struct nilfs_root - nilfs root object
 * @cno: checkpoint number
 * @rb_node: red-black tree node
 * @count: refcount of this structure
 * @nilfs: nilfs object
 * @ifile: inode file
 * @inodes_count: number of inodes
 * @blocks_count: number of blocks
 * @snapshot_kobj: /sys/fs/<nilfs>/<device>/mounted_snapshots/<snapshot>
 * @snapshot_kobj_unregister: completion state for kernel object
 */
struct nilfs_root {
	__u64 cno;
	struct rb_node rb_node;

	atomic_t count;
	struct the_nilfs *nilfs;
	struct inode *ifile;

	atomic64_t inodes_count;
	atomic64_t blocks_count;

	/* /sys/fs/<nilfs>/<device>/mounted_snapshots/<snapshot> */
	struct kobject snapshot_kobj;
	struct completion snapshot_kobj_unregister;
};
/* Special checkpoint number */
#define NILFS_CPTREE_CURRENT_CNO 0

/* Minimum interval of periodical update of superblocks (in seconds) */
#define NILFS_SB_FREQ 10
  244. static inline int nilfs_sb_need_update(struct the_nilfs *nilfs)
  245. {
  246. u64 t = get_seconds();
  247. return t < nilfs->ns_sbwtime ||
  248. t > nilfs->ns_sbwtime + nilfs->ns_sb_update_freq;
  249. }
  250. static inline int nilfs_sb_will_flip(struct the_nilfs *nilfs)
  251. {
  252. int flip_bits = nilfs->ns_sbwcount & 0x0FL;
  253. return (flip_bits != 0x08 && flip_bits != 0x0F);
  254. }
  255. void nilfs_set_last_segment(struct the_nilfs *, sector_t, u64, __u64);
  256. struct the_nilfs *alloc_nilfs(struct block_device *bdev);
  257. void destroy_nilfs(struct the_nilfs *nilfs);
  258. int init_nilfs(struct the_nilfs *nilfs, struct super_block *sb, char *data);
  259. int load_nilfs(struct the_nilfs *nilfs, struct super_block *sb);
  260. unsigned long nilfs_nrsvsegs(struct the_nilfs *nilfs, unsigned long nsegs);
  261. void nilfs_set_nsegments(struct the_nilfs *nilfs, unsigned long nsegs);
  262. int nilfs_discard_segments(struct the_nilfs *, __u64 *, size_t);
  263. int nilfs_count_free_blocks(struct the_nilfs *, sector_t *);
  264. struct nilfs_root *nilfs_lookup_root(struct the_nilfs *nilfs, __u64 cno);
  265. struct nilfs_root *nilfs_find_or_create_root(struct the_nilfs *nilfs,
  266. __u64 cno);
  267. void nilfs_put_root(struct nilfs_root *root);
  268. int nilfs_near_disk_full(struct the_nilfs *);
  269. void nilfs_fall_back_super_block(struct the_nilfs *);
  270. void nilfs_swap_super_block(struct the_nilfs *);
/**
 * nilfs_get_root - take a reference on a nilfs root object
 * @root: root object whose reference count is incremented
 *
 * Atomically increments @root->count.
 */
static inline void nilfs_get_root(struct nilfs_root *root)
{
	atomic_inc(&root->count);
}
  275. static inline int nilfs_valid_fs(struct the_nilfs *nilfs)
  276. {
  277. unsigned valid_fs;
  278. down_read(&nilfs->ns_sem);
  279. valid_fs = (nilfs->ns_mount_state & NILFS_VALID_FS);
  280. up_read(&nilfs->ns_sem);
  281. return valid_fs;
  282. }
  283. static inline void
  284. nilfs_get_segment_range(struct the_nilfs *nilfs, __u64 segnum,
  285. sector_t *seg_start, sector_t *seg_end)
  286. {
  287. *seg_start = (sector_t)nilfs->ns_blocks_per_segment * segnum;
  288. *seg_end = *seg_start + nilfs->ns_blocks_per_segment - 1;
  289. if (segnum == 0)
  290. *seg_start = nilfs->ns_first_data_block;
  291. }
  292. static inline sector_t
  293. nilfs_get_segment_start_blocknr(struct the_nilfs *nilfs, __u64 segnum)
  294. {
  295. return (segnum == 0) ? nilfs->ns_first_data_block :
  296. (sector_t)nilfs->ns_blocks_per_segment * segnum;
  297. }
  298. static inline __u64
  299. nilfs_get_segnum_of_block(struct the_nilfs *nilfs, sector_t blocknr)
  300. {
  301. sector_t segnum = blocknr;
  302. sector_div(segnum, nilfs->ns_blocks_per_segment);
  303. return segnum;
  304. }
  305. static inline void
  306. nilfs_terminate_segment(struct the_nilfs *nilfs, sector_t seg_start,
  307. sector_t seg_end)
  308. {
  309. /* terminate the current full segment (used in case of I/O-error) */
  310. nilfs->ns_pseg_offset = seg_end - seg_start + 1;
  311. }
/**
 * nilfs_shift_to_next_segment - move forward with a full segment
 * @nilfs: nilfs object
 *
 * Makes @ns_nextnum the current segment number, resets the partial
 * segment offset to zero and increments the segment sequence counter.
 */
static inline void nilfs_shift_to_next_segment(struct the_nilfs *nilfs)
{
	/* move forward with a full segment */
	nilfs->ns_segnum = nilfs->ns_nextnum;
	nilfs->ns_pseg_offset = 0;
	nilfs->ns_seg_seq++;
}
  319. static inline __u64 nilfs_last_cno(struct the_nilfs *nilfs)
  320. {
  321. __u64 cno;
  322. spin_lock(&nilfs->ns_last_segment_lock);
  323. cno = nilfs->ns_last_cno;
  324. spin_unlock(&nilfs->ns_last_segment_lock);
  325. return cno;
  326. }
  327. static inline int nilfs_segment_is_active(struct the_nilfs *nilfs, __u64 n)
  328. {
  329. return n == nilfs->ns_segnum || n == nilfs->ns_nextnum;
  330. }
  331. static inline int nilfs_flush_device(struct the_nilfs *nilfs)
  332. {
  333. int err;
  334. if (!nilfs_test_opt(nilfs, BARRIER) || nilfs->ns_flushed_device)
  335. return 0;
  336. nilfs->ns_flushed_device = 1;
  337. /*
  338. * the store to ns_flushed_device must not be reordered after
  339. * blkdev_issue_flush().
  340. */
  341. smp_wmb();
  342. err = blkdev_issue_flush(nilfs->ns_bdev, GFP_KERNEL, NULL);
  343. if (err != -EIO)
  344. err = 0;
  345. return err;
  346. }
  347. #endif /* _THE_NILFS_H */