blob: f4968145c2a3ee22bdbff5fb7d4e2dd40f6fd392 [file] [log] [blame]
/*
 * the_nilfs.h - the_nilfs shared structure.
 *
 * Copyright (C) 2005-2008 Nippon Telegraph and Telephone Corporation.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 *
 * Written by Ryusuke Konishi <ryusuke@osrg.net>
 *
 */
23
24#ifndef _THE_NILFS_H
25#define _THE_NILFS_H
26
27#include <linux/types.h>
28#include <linux/buffer_head.h>
Ryusuke Konishiba65ae42010-08-14 12:59:15 +090029#include <linux/rbtree.h>
Ryusuke Konishi65b46432009-04-06 19:01:23 -070030#include <linux/fs.h>
31#include <linux/blkdev.h>
32#include <linux/backing-dev.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090033#include <linux/slab.h>
Ryusuke Konishi65b46432009-04-06 19:01:23 -070034
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +090035struct nilfs_sc_info;
36
/*
 * Bit numbers for the ns_flags member of struct the_nilfs.  They are used
 * as bit indices by the set_nilfs_*(), clear_nilfs_*() and nilfs_*() helpers
 * generated with THE_NILFS_FNS().
 */
enum {
	THE_NILFS_INIT = 0,	/* Information from super_block is set */
	THE_NILFS_DISCONTINUED,	/* 'next' pointer chain has broken */
	THE_NILFS_GC_RUNNING,	/* gc process is running */
	THE_NILFS_SB_DIRTY,	/* super block is dirty */
};
44
45/**
46 * struct the_nilfs - struct to supervise multiple nilfs mount points
47 * @ns_flags: flags
Ryusuke Konishi65b46432009-04-06 19:01:23 -070048 * @ns_bdev: block device
Ryusuke Konishi65b46432009-04-06 19:01:23 -070049 * @ns_sem: semaphore for shared states
Ryusuke Konishie339ad32009-04-06 19:01:59 -070050 * @ns_sbh: buffer heads of on-disk super blocks
51 * @ns_sbp: pointers to super block data
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +090052 * @ns_sbwtime: previous write time of super block
53 * @ns_sbwcount: write count of super block
Ryusuke Konishie339ad32009-04-06 19:01:59 -070054 * @ns_sbsize: size of valid data in super block
Ryusuke Konishi65b46432009-04-06 19:01:23 -070055 * @ns_seg_seq: segment sequence counter
56 * @ns_segnum: index number of the latest full segment.
57 * @ns_nextnum: index number of the full segment index to be used next
58 * @ns_pseg_offset: offset of next partial segment in the current full segment
59 * @ns_cno: next checkpoint number
60 * @ns_ctime: write time of the last segment
61 * @ns_nongc_ctime: write time of the last segment not for cleaner operation
62 * @ns_ndirtyblks: Number of dirty data blocks
63 * @ns_last_segment_lock: lock protecting fields for the latest segment
64 * @ns_last_pseg: start block number of the latest segment
65 * @ns_last_seq: sequence value of the latest segment
66 * @ns_last_cno: checkpoint number of the latest segment
Ryusuke Konishi2c2e52f2009-04-06 19:01:54 -070067 * @ns_prot_seq: least sequence number of segments which must not be reclaimed
Ryusuke Konishi32502042010-06-29 14:42:13 +090068 * @ns_prev_seq: base sequence number used to decide if advance log cursor
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +090069 * @ns_writer: log writer
70 * @ns_segctor_sem: semaphore protecting log write
Ryusuke Konishi65b46432009-04-06 19:01:23 -070071 * @ns_dat: DAT file inode
72 * @ns_cpfile: checkpoint file inode
73 * @ns_sufile: segusage file inode
Ryusuke Konishiba65ae42010-08-14 12:59:15 +090074 * @ns_cptree: rb-tree of all mounted checkpoints (nilfs_root)
75 * @ns_cptree_lock: lock protecting @ns_cptree
Ryusuke Konishi693dd322011-03-09 11:05:07 +090076 * @ns_dirty_files: list of dirty files
77 * @ns_inode_lock: lock protecting @ns_dirty_files
Ryusuke Konishi65b46432009-04-06 19:01:23 -070078 * @ns_gc_inodes: dummy inodes to keep live blocks
Ryusuke Konishi9b1fc4e42011-03-09 11:05:08 +090079 * @ns_next_generation: next generation number for inodes
80 * @ns_next_gen_lock: lock protecting @ns_next_generation
Ryusuke Konishi3b2ce582011-03-09 11:05:07 +090081 * @ns_mount_opt: mount options
Ryusuke Konishi574e6c32011-03-09 11:05:07 +090082 * @ns_resuid: uid for reserved blocks
83 * @ns_resgid: gid for reserved blocks
84 * @ns_interval: checkpoint creation interval
85 * @ns_watermark: watermark for the number of dirty buffers
Ryusuke Konishi65b46432009-04-06 19:01:23 -070086 * @ns_blocksize_bits: bit length of block size
Ryusuke Konishi92c60cc2010-05-23 00:17:48 +090087 * @ns_blocksize: block size
Ryusuke Konishi65b46432009-04-06 19:01:23 -070088 * @ns_nsegments: number of segments in filesystem
89 * @ns_blocks_per_segment: number of blocks per segment
90 * @ns_r_segments_percentage: reserved segments percentage
91 * @ns_nrsvsegs: number of reserved segments
92 * @ns_first_data_block: block number of first data block
93 * @ns_inode_size: size of on-disk inode
94 * @ns_first_ino: first not-special inode number
95 * @ns_crc_seed: seed value of CRC32 calculation
96 */
97struct the_nilfs {
98 unsigned long ns_flags;
Ryusuke Konishi65b46432009-04-06 19:01:23 -070099
100 struct block_device *ns_bdev;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700101 struct rw_semaphore ns_sem;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700102
Ryusuke Konishie59399d2009-06-08 01:39:32 +0900103 /*
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700104 * used for
105 * - loading the latest checkpoint exclusively.
106 * - allocating a new full segment.
107 * - protecting s_dirt in the super_block struct
108 * (see nilfs_write_super) and the following fields.
109 */
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700110 struct buffer_head *ns_sbh[2];
111 struct nilfs_super_block *ns_sbp[2];
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900112 time_t ns_sbwtime;
113 unsigned ns_sbwcount;
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700114 unsigned ns_sbsize;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700115 unsigned ns_mount_state;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700116
117 /*
118 * Following fields are dedicated to a writable FS-instance.
119 * Except for the period seeking checkpoint, code outside the segment
Ryusuke Konishi47420c72009-04-06 19:01:45 -0700120 * constructor must lock a segment semaphore while accessing these
121 * fields.
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700122 * The writable FS-instance is sole during a lifetime of the_nilfs.
123 */
124 u64 ns_seg_seq;
125 __u64 ns_segnum;
126 __u64 ns_nextnum;
127 unsigned long ns_pseg_offset;
128 __u64 ns_cno;
129 time_t ns_ctime;
130 time_t ns_nongc_ctime;
131 atomic_t ns_ndirtyblks;
132
133 /*
134 * The following fields hold information on the latest partial segment
135 * written to disk with a super root. These fields are protected by
136 * ns_last_segment_lock.
137 */
138 spinlock_t ns_last_segment_lock;
139 sector_t ns_last_pseg;
140 u64 ns_last_seq;
141 __u64 ns_last_cno;
Ryusuke Konishi2c2e52f2009-04-06 19:01:54 -0700142 u64 ns_prot_seq;
Ryusuke Konishi32502042010-06-29 14:42:13 +0900143 u64 ns_prev_seq;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700144
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +0900145 struct nilfs_sc_info *ns_writer;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700146 struct rw_semaphore ns_segctor_sem;
147
148 /*
149 * Following fields are lock free except for the period before
150 * the_nilfs is initialized.
151 */
152 struct inode *ns_dat;
153 struct inode *ns_cpfile;
154 struct inode *ns_sufile;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700155
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900156 /* Checkpoint tree */
157 struct rb_root ns_cptree;
158 spinlock_t ns_cptree_lock;
159
Ryusuke Konishi693dd322011-03-09 11:05:07 +0900160 /* Dirty inode list */
161 struct list_head ns_dirty_files;
162 spinlock_t ns_inode_lock;
163
Ryusuke Konishi263d90c2010-08-20 19:06:11 +0900164 /* GC inode list */
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700165 struct list_head ns_gc_inodes;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700166
Ryusuke Konishi9b1fc4e42011-03-09 11:05:08 +0900167 /* Inode allocator */
168 u32 ns_next_generation;
169 spinlock_t ns_next_gen_lock;
170
Ryusuke Konishi3b2ce582011-03-09 11:05:07 +0900171 /* Mount options */
172 unsigned long ns_mount_opt;
173
Ryusuke Konishi574e6c32011-03-09 11:05:07 +0900174 uid_t ns_resuid;
175 gid_t ns_resgid;
176 unsigned long ns_interval;
177 unsigned long ns_watermark;
178
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700179 /* Disk layout information (static) */
180 unsigned int ns_blocksize_bits;
Ryusuke Konishi92c60cc2010-05-23 00:17:48 +0900181 unsigned int ns_blocksize;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700182 unsigned long ns_nsegments;
183 unsigned long ns_blocks_per_segment;
184 unsigned long ns_r_segments_percentage;
185 unsigned long ns_nrsvsegs;
186 unsigned long ns_first_data_block;
187 int ns_inode_size;
188 int ns_first_ino;
189 u32 ns_crc_seed;
190};
191
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700192#define THE_NILFS_FNS(bit, name) \
193static inline void set_nilfs_##name(struct the_nilfs *nilfs) \
194{ \
195 set_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
196} \
197static inline void clear_nilfs_##name(struct the_nilfs *nilfs) \
198{ \
199 clear_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
200} \
201static inline int nilfs_##name(struct the_nilfs *nilfs) \
202{ \
203 return test_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
204}
205
206THE_NILFS_FNS(INIT, init)
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700207THE_NILFS_FNS(DISCONTINUED, discontinued)
Jiro SEKIBA1cf58fa2009-09-03 22:24:17 +0900208THE_NILFS_FNS(GC_RUNNING, gc_running)
Ryusuke Konishie605f0a2009-12-09 00:57:52 +0900209THE_NILFS_FNS(SB_DIRTY, sb_dirty)
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700210
/*
 * Mount option operations
 *
 * Each macro takes a pointer to an object with an ns_mount_opt member and
 * an option name without its NILFS_MOUNT_ prefix.
 *
 * nilfs_clear_opt() - clear the bits of NILFS_MOUNT_<opt>
 * nilfs_set_opt()   - set the bits of NILFS_MOUNT_<opt>
 * nilfs_test_opt()  - evaluate to the NILFS_MOUNT_<opt> bits currently set
 *                     (nonzero if any is set, not normalized to 0/1)
 * nilfs_write_opt() - clear the bits of NILFS_MOUNT_<mask>, then set the
 *                     bits of NILFS_MOUNT_<opt>
 */
#define nilfs_clear_opt(nilfs, opt)  \
	do { (nilfs)->ns_mount_opt &= ~NILFS_MOUNT_##opt; } while (0)
#define nilfs_set_opt(nilfs, opt)  \
	do { (nilfs)->ns_mount_opt |= NILFS_MOUNT_##opt; } while (0)
#define nilfs_test_opt(nilfs, opt) ((nilfs)->ns_mount_opt & NILFS_MOUNT_##opt)
#define nilfs_write_opt(nilfs, mask, opt)				\
	do { (nilfs)->ns_mount_opt =					\
		(((nilfs)->ns_mount_opt & ~NILFS_MOUNT_##mask) |	\
		 NILFS_MOUNT_##opt);					\
	} while (0)
224
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900225/**
226 * struct nilfs_root - nilfs root object
227 * @cno: checkpoint number
228 * @rb_node: red-black tree node
229 * @count: refcount of this structure
230 * @nilfs: nilfs object
231 * @ifile: inode file
232 * @root: root inode
233 * @inodes_count: number of inodes
234 * @blocks_count: number of blocks (Reserved)
235 */
236struct nilfs_root {
237 __u64 cno;
238 struct rb_node rb_node;
239
240 atomic_t count;
241 struct the_nilfs *nilfs;
242 struct inode *ifile;
243
244 atomic_t inodes_count;
245 atomic_t blocks_count;
246};
247
/* Special checkpoint number */
#define NILFS_CPTREE_CURRENT_CNO	0

/* Minimum interval of periodical update of superblocks (in seconds) */
#define NILFS_SB_FREQ		10
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700253
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900254static inline int nilfs_sb_need_update(struct the_nilfs *nilfs)
255{
256 u64 t = get_seconds();
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900257 return t < nilfs->ns_sbwtime || t > nilfs->ns_sbwtime + NILFS_SB_FREQ;
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900258}
259
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900260static inline int nilfs_sb_will_flip(struct the_nilfs *nilfs)
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900261{
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900262 int flip_bits = nilfs->ns_sbwcount & 0x0FL;
263 return (flip_bits != 0x08 && flip_bits != 0x0F);
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900264}
265
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700266void nilfs_set_last_segment(struct the_nilfs *, sector_t, u64, __u64);
Ryusuke Konishi348fe8d2010-09-09 02:07:56 +0900267struct the_nilfs *alloc_nilfs(struct block_device *bdev);
268void destroy_nilfs(struct the_nilfs *nilfs);
Ryusuke Konishif7545142011-03-09 11:05:08 +0900269int init_nilfs(struct the_nilfs *nilfs, struct super_block *sb, char *data);
270int load_nilfs(struct the_nilfs *nilfs, struct super_block *sb);
Jiro SEKIBAe902ec92010-01-30 18:06:35 +0900271int nilfs_discard_segments(struct the_nilfs *, __u64 *, size_t);
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700272int nilfs_count_free_blocks(struct the_nilfs *, sector_t *);
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900273struct nilfs_root *nilfs_lookup_root(struct the_nilfs *nilfs, __u64 cno);
274struct nilfs_root *nilfs_find_or_create_root(struct the_nilfs *nilfs,
275 __u64 cno);
276void nilfs_put_root(struct nilfs_root *root);
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700277int nilfs_near_disk_full(struct the_nilfs *);
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700278void nilfs_fall_back_super_block(struct the_nilfs *);
279void nilfs_swap_super_block(struct the_nilfs *);
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700280
281
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900282static inline void nilfs_get_root(struct nilfs_root *root)
283{
284 atomic_inc(&root->count);
285}
286
Ryusuke Konishia057d2c2009-11-19 19:58:46 +0900287static inline int nilfs_valid_fs(struct the_nilfs *nilfs)
288{
289 unsigned valid_fs;
290
291 down_read(&nilfs->ns_sem);
292 valid_fs = (nilfs->ns_mount_state & NILFS_VALID_FS);
293 up_read(&nilfs->ns_sem);
294 return valid_fs;
295}
296
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700297static inline void
298nilfs_get_segment_range(struct the_nilfs *nilfs, __u64 segnum,
299 sector_t *seg_start, sector_t *seg_end)
300{
301 *seg_start = (sector_t)nilfs->ns_blocks_per_segment * segnum;
302 *seg_end = *seg_start + nilfs->ns_blocks_per_segment - 1;
303 if (segnum == 0)
304 *seg_start = nilfs->ns_first_data_block;
305}
306
307static inline sector_t
308nilfs_get_segment_start_blocknr(struct the_nilfs *nilfs, __u64 segnum)
309{
310 return (segnum == 0) ? nilfs->ns_first_data_block :
311 (sector_t)nilfs->ns_blocks_per_segment * segnum;
312}
313
314static inline __u64
315nilfs_get_segnum_of_block(struct the_nilfs *nilfs, sector_t blocknr)
316{
317 sector_t segnum = blocknr;
318
319 sector_div(segnum, nilfs->ns_blocks_per_segment);
320 return segnum;
321}
322
323static inline void
324nilfs_terminate_segment(struct the_nilfs *nilfs, sector_t seg_start,
325 sector_t seg_end)
326{
327 /* terminate the current full segment (used in case of I/O-error) */
328 nilfs->ns_pseg_offset = seg_end - seg_start + 1;
329}
330
331static inline void nilfs_shift_to_next_segment(struct the_nilfs *nilfs)
332{
333 /* move forward with a full segment */
334 nilfs->ns_segnum = nilfs->ns_nextnum;
335 nilfs->ns_pseg_offset = 0;
336 nilfs->ns_seg_seq++;
337}
338
339static inline __u64 nilfs_last_cno(struct the_nilfs *nilfs)
340{
341 __u64 cno;
342
343 spin_lock(&nilfs->ns_last_segment_lock);
344 cno = nilfs->ns_last_cno;
345 spin_unlock(&nilfs->ns_last_segment_lock);
346 return cno;
347}
348
Ryusuke Konishicece5522009-04-06 19:01:58 -0700349static inline int nilfs_segment_is_active(struct the_nilfs *nilfs, __u64 n)
350{
351 return n == nilfs->ns_segnum || n == nilfs->ns_nextnum;
352}
353
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700354#endif /* _THE_NILFS_H */