blob: 06d2548d436d093602b808c48f21aa074c6d429c [file] [log] [blame]
/*
 * the_nilfs.h - the_nilfs shared structure.
 *
 * Copyright (C) 2005-2008 Nippon Telegraph and Telephone Corporation.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * Written by Ryusuke Konishi.
 *
 */
19
20#ifndef _THE_NILFS_H
21#define _THE_NILFS_H
22
23#include <linux/types.h>
24#include <linux/buffer_head.h>
Ryusuke Konishiba65ae42010-08-14 12:59:15 +090025#include <linux/rbtree.h>
Ryusuke Konishi65b46432009-04-06 19:01:23 -070026#include <linux/fs.h>
27#include <linux/blkdev.h>
28#include <linux/backing-dev.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090029#include <linux/slab.h>
Ryusuke Konishi65b46432009-04-06 19:01:23 -070030
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +090031struct nilfs_sc_info;
Vyacheslav Dubeykocaa05d42014-08-08 14:20:42 -070032struct nilfs_sysfs_dev_subgroups;
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +090033
/*
 * State flags of struct the_nilfs.  Each enumerator is a bit number in
 * the_nilfs.ns_flags and is accessed through the helpers generated by
 * THE_NILFS_FNS().
 */
enum {
	/* Information from super_block is set */
	THE_NILFS_INIT = 0,
	/* 'next' pointer chain has broken */
	THE_NILFS_DISCONTINUED,
	/* gc process is running */
	THE_NILFS_GC_RUNNING,
	/* super block is dirty */
	THE_NILFS_SB_DIRTY,
};
41
42/**
43 * struct the_nilfs - struct to supervise multiple nilfs mount points
44 * @ns_flags: flags
Andreas Rohnere2c76172014-10-13 15:53:20 -070045 * @ns_flushed_device: flag indicating if all volatile data was flushed
Ryusuke Konishi65b46432009-04-06 19:01:23 -070046 * @ns_bdev: block device
Ryusuke Konishi65b46432009-04-06 19:01:23 -070047 * @ns_sem: semaphore for shared states
Ryusuke Konishi572d8b32012-07-30 14:42:07 -070048 * @ns_snapshot_mount_mutex: mutex to protect snapshot mounts
Ryusuke Konishie339ad32009-04-06 19:01:59 -070049 * @ns_sbh: buffer heads of on-disk super blocks
50 * @ns_sbp: pointers to super block data
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +090051 * @ns_sbwtime: previous write time of super block
52 * @ns_sbwcount: write count of super block
Ryusuke Konishie339ad32009-04-06 19:01:59 -070053 * @ns_sbsize: size of valid data in super block
Vyacheslav Dubeyko6b0f3392012-07-30 14:42:02 -070054 * @ns_mount_state: file system state
Vyacheslav Dubeykocaa05d42014-08-08 14:20:42 -070055 * @ns_sb_update_freq: interval of periodical update of superblocks (in seconds)
Ryusuke Konishi65b46432009-04-06 19:01:23 -070056 * @ns_seg_seq: segment sequence counter
57 * @ns_segnum: index number of the latest full segment.
58 * @ns_nextnum: index number of the full segment index to be used next
59 * @ns_pseg_offset: offset of next partial segment in the current full segment
60 * @ns_cno: next checkpoint number
61 * @ns_ctime: write time of the last segment
62 * @ns_nongc_ctime: write time of the last segment not for cleaner operation
63 * @ns_ndirtyblks: Number of dirty data blocks
64 * @ns_last_segment_lock: lock protecting fields for the latest segment
65 * @ns_last_pseg: start block number of the latest segment
66 * @ns_last_seq: sequence value of the latest segment
67 * @ns_last_cno: checkpoint number of the latest segment
Ryusuke Konishi2c2e52f2009-04-06 19:01:54 -070068 * @ns_prot_seq: least sequence number of segments which must not be reclaimed
Ryusuke Konishi32502042010-06-29 14:42:13 +090069 * @ns_prev_seq: base sequence number used to decide if advance log cursor
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +090070 * @ns_writer: log writer
71 * @ns_segctor_sem: semaphore protecting log write
Ryusuke Konishi65b46432009-04-06 19:01:23 -070072 * @ns_dat: DAT file inode
73 * @ns_cpfile: checkpoint file inode
74 * @ns_sufile: segusage file inode
Ryusuke Konishiba65ae42010-08-14 12:59:15 +090075 * @ns_cptree: rb-tree of all mounted checkpoints (nilfs_root)
76 * @ns_cptree_lock: lock protecting @ns_cptree
Ryusuke Konishi693dd322011-03-09 11:05:07 +090077 * @ns_dirty_files: list of dirty files
78 * @ns_inode_lock: lock protecting @ns_dirty_files
Ryusuke Konishi65b46432009-04-06 19:01:23 -070079 * @ns_gc_inodes: dummy inodes to keep live blocks
Ryusuke Konishi9b1fc4e42011-03-09 11:05:08 +090080 * @ns_next_generation: next generation number for inodes
81 * @ns_next_gen_lock: lock protecting @ns_next_generation
Ryusuke Konishi3b2ce582011-03-09 11:05:07 +090082 * @ns_mount_opt: mount options
Ryusuke Konishi574e6c32011-03-09 11:05:07 +090083 * @ns_resuid: uid for reserved blocks
84 * @ns_resgid: gid for reserved blocks
85 * @ns_interval: checkpoint creation interval
86 * @ns_watermark: watermark for the number of dirty buffers
Ryusuke Konishi65b46432009-04-06 19:01:23 -070087 * @ns_blocksize_bits: bit length of block size
Ryusuke Konishi92c60cc2010-05-23 00:17:48 +090088 * @ns_blocksize: block size
Ryusuke Konishi65b46432009-04-06 19:01:23 -070089 * @ns_nsegments: number of segments in filesystem
90 * @ns_blocks_per_segment: number of blocks per segment
91 * @ns_r_segments_percentage: reserved segments percentage
92 * @ns_nrsvsegs: number of reserved segments
93 * @ns_first_data_block: block number of first data block
94 * @ns_inode_size: size of on-disk inode
95 * @ns_first_ino: first not-special inode number
96 * @ns_crc_seed: seed value of CRC32 calculation
Vyacheslav Dubeykoda7141f2014-08-08 14:20:39 -070097 * @ns_dev_kobj: /sys/fs/<nilfs>/<device>
98 * @ns_dev_kobj_unregister: completion state
Vyacheslav Dubeykocaa05d42014-08-08 14:20:42 -070099 * @ns_dev_subgroups: <device> subgroups pointer
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700100 */
101struct the_nilfs {
102 unsigned long ns_flags;
Andreas Rohnere2c76172014-10-13 15:53:20 -0700103 int ns_flushed_device;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700104
105 struct block_device *ns_bdev;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700106 struct rw_semaphore ns_sem;
Ryusuke Konishi572d8b32012-07-30 14:42:07 -0700107 struct mutex ns_snapshot_mount_mutex;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700108
Ryusuke Konishie59399d2009-06-08 01:39:32 +0900109 /*
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700110 * used for
111 * - loading the latest checkpoint exclusively.
112 * - allocating a new full segment.
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700113 */
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700114 struct buffer_head *ns_sbh[2];
115 struct nilfs_super_block *ns_sbp[2];
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900116 time_t ns_sbwtime;
Ryusuke Konishi0c6c44c2016-05-23 16:23:39 -0700117 unsigned int ns_sbwcount;
118 unsigned int ns_sbsize;
119 unsigned int ns_mount_state;
120 unsigned int ns_sb_update_freq;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700121
122 /*
123 * Following fields are dedicated to a writable FS-instance.
124 * Except for the period seeking checkpoint, code outside the segment
Ryusuke Konishi47420c72009-04-06 19:01:45 -0700125 * constructor must lock a segment semaphore while accessing these
126 * fields.
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700127 * The writable FS-instance is sole during a lifetime of the_nilfs.
128 */
129 u64 ns_seg_seq;
130 __u64 ns_segnum;
131 __u64 ns_nextnum;
132 unsigned long ns_pseg_offset;
133 __u64 ns_cno;
134 time_t ns_ctime;
135 time_t ns_nongc_ctime;
136 atomic_t ns_ndirtyblks;
137
138 /*
139 * The following fields hold information on the latest partial segment
140 * written to disk with a super root. These fields are protected by
141 * ns_last_segment_lock.
142 */
143 spinlock_t ns_last_segment_lock;
144 sector_t ns_last_pseg;
145 u64 ns_last_seq;
146 __u64 ns_last_cno;
Ryusuke Konishi2c2e52f2009-04-06 19:01:54 -0700147 u64 ns_prot_seq;
Ryusuke Konishi32502042010-06-29 14:42:13 +0900148 u64 ns_prev_seq;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700149
Ryusuke Konishi3fd3fe52011-03-09 11:05:08 +0900150 struct nilfs_sc_info *ns_writer;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700151 struct rw_semaphore ns_segctor_sem;
152
153 /*
154 * Following fields are lock free except for the period before
155 * the_nilfs is initialized.
156 */
157 struct inode *ns_dat;
158 struct inode *ns_cpfile;
159 struct inode *ns_sufile;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700160
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900161 /* Checkpoint tree */
162 struct rb_root ns_cptree;
163 spinlock_t ns_cptree_lock;
164
Ryusuke Konishi693dd322011-03-09 11:05:07 +0900165 /* Dirty inode list */
166 struct list_head ns_dirty_files;
167 spinlock_t ns_inode_lock;
168
Ryusuke Konishi263d90c2010-08-20 19:06:11 +0900169 /* GC inode list */
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700170 struct list_head ns_gc_inodes;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700171
Ryusuke Konishi9b1fc4e42011-03-09 11:05:08 +0900172 /* Inode allocator */
173 u32 ns_next_generation;
174 spinlock_t ns_next_gen_lock;
175
Ryusuke Konishi3b2ce582011-03-09 11:05:07 +0900176 /* Mount options */
177 unsigned long ns_mount_opt;
178
Ryusuke Konishi574e6c32011-03-09 11:05:07 +0900179 uid_t ns_resuid;
180 gid_t ns_resgid;
181 unsigned long ns_interval;
182 unsigned long ns_watermark;
183
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700184 /* Disk layout information (static) */
185 unsigned int ns_blocksize_bits;
Ryusuke Konishi92c60cc2010-05-23 00:17:48 +0900186 unsigned int ns_blocksize;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700187 unsigned long ns_nsegments;
188 unsigned long ns_blocks_per_segment;
189 unsigned long ns_r_segments_percentage;
190 unsigned long ns_nrsvsegs;
191 unsigned long ns_first_data_block;
192 int ns_inode_size;
193 int ns_first_ino;
194 u32 ns_crc_seed;
Vyacheslav Dubeykoda7141f2014-08-08 14:20:39 -0700195
196 /* /sys/fs/<nilfs>/<device> */
197 struct kobject ns_dev_kobj;
198 struct completion ns_dev_kobj_unregister;
Vyacheslav Dubeykocaa05d42014-08-08 14:20:42 -0700199 struct nilfs_sysfs_dev_subgroups *ns_dev_subgroups;
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700200};
201
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700202#define THE_NILFS_FNS(bit, name) \
203static inline void set_nilfs_##name(struct the_nilfs *nilfs) \
204{ \
205 set_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
206} \
207static inline void clear_nilfs_##name(struct the_nilfs *nilfs) \
208{ \
209 clear_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
210} \
211static inline int nilfs_##name(struct the_nilfs *nilfs) \
212{ \
213 return test_bit(THE_NILFS_##bit, &(nilfs)->ns_flags); \
214}
215
216THE_NILFS_FNS(INIT, init)
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700217THE_NILFS_FNS(DISCONTINUED, discontinued)
Jiro SEKIBA1cf58fa2009-09-03 22:24:17 +0900218THE_NILFS_FNS(GC_RUNNING, gc_running)
Ryusuke Konishie605f0a2009-12-09 00:57:52 +0900219THE_NILFS_FNS(SB_DIRTY, sb_dirty)
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700220
/*
 * Mount option operations
 *
 * Every helper pastes its option argument onto NILFS_MOUNT_ to obtain a
 * mask and applies it to (nilfs)->ns_mount_opt:
 *   nilfs_clear_opt() - clear the bits of NILFS_MOUNT_<opt>
 *   nilfs_set_opt()   - set the bits of NILFS_MOUNT_<opt>
 *   nilfs_test_opt()  - evaluate to ns_mount_opt masked by NILFS_MOUNT_<opt>
 *   nilfs_write_opt() - clear the bits of NILFS_MOUNT_<mask>, then set the
 *                       bits of NILFS_MOUNT_<opt>
 *
 * nilfs_write_opt() expands its nilfs argument twice, so the argument
 * should be free of side effects.
 */
#define nilfs_clear_opt(nilfs, opt)					\
	do {								\
		(nilfs)->ns_mount_opt &= ~NILFS_MOUNT_##opt;		\
	} while (0)
#define nilfs_set_opt(nilfs, opt)					\
	do {								\
		(nilfs)->ns_mount_opt |= NILFS_MOUNT_##opt;		\
	} while (0)
#define nilfs_test_opt(nilfs, opt)					\
	((nilfs)->ns_mount_opt & NILFS_MOUNT_##opt)
#define nilfs_write_opt(nilfs, mask, opt)				\
	do {								\
		(nilfs)->ns_mount_opt =					\
			(((nilfs)->ns_mount_opt & ~NILFS_MOUNT_##mask) | \
			 NILFS_MOUNT_##opt);				\
	} while (0)
234
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900235/**
236 * struct nilfs_root - nilfs root object
237 * @cno: checkpoint number
238 * @rb_node: red-black tree node
239 * @count: refcount of this structure
240 * @nilfs: nilfs object
241 * @ifile: inode file
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900242 * @inodes_count: number of inodes
Vyacheslav Dubeykof5974c82012-07-30 14:42:10 -0700243 * @blocks_count: number of blocks
Vyacheslav Dubeykoa5a73322014-08-08 14:20:52 -0700244 * @snapshot_kobj: /sys/fs/<nilfs>/<device>/mounted_snapshots/<snapshot>
245 * @snapshot_kobj_unregister: completion state for kernel object
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900246 */
247struct nilfs_root {
248 __u64 cno;
249 struct rb_node rb_node;
250
251 atomic_t count;
252 struct the_nilfs *nilfs;
253 struct inode *ifile;
254
Vyacheslav Dubeykoe5f7f842013-07-03 15:08:06 -0700255 atomic64_t inodes_count;
256 atomic64_t blocks_count;
Vyacheslav Dubeykoa5a73322014-08-08 14:20:52 -0700257
258 /* /sys/fs/<nilfs>/<device>/mounted_snapshots/<snapshot> */
259 struct kobject snapshot_kobj;
260 struct completion snapshot_kobj_unregister;
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900261};
262
/*
 * Special checkpoint number.
 * NOTE(review): the name suggests it stands for the current (latest)
 * checkpoint in the checkpoint tree - confirm against the callers.
 */
#define NILFS_CPTREE_CURRENT_CNO	0

/* Minimum interval of periodical update of superblocks (in seconds) */
#define NILFS_SB_FREQ			10
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700268
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900269static inline int nilfs_sb_need_update(struct the_nilfs *nilfs)
270{
271 u64 t = get_seconds();
Ryusuke Konishi4ad364c2016-05-23 16:23:25 -0700272
Vyacheslav Dubeykocaa05d42014-08-08 14:20:42 -0700273 return t < nilfs->ns_sbwtime ||
274 t > nilfs->ns_sbwtime + nilfs->ns_sb_update_freq;
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900275}
276
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900277static inline int nilfs_sb_will_flip(struct the_nilfs *nilfs)
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900278{
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900279 int flip_bits = nilfs->ns_sbwcount & 0x0FL;
Ryusuke Konishi4ad364c2016-05-23 16:23:25 -0700280
Jiro SEKIBAb2ac86e2010-06-28 17:49:33 +0900281 return (flip_bits != 0x08 && flip_bits != 0x0F);
Jiro SEKIBA79efdd92009-07-23 01:26:34 +0900282}
283
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700284void nilfs_set_last_segment(struct the_nilfs *, sector_t, u64, __u64);
Ryusuke Konishi348fe8d2010-09-09 02:07:56 +0900285struct the_nilfs *alloc_nilfs(struct block_device *bdev);
286void destroy_nilfs(struct the_nilfs *nilfs);
Ryusuke Konishif7545142011-03-09 11:05:08 +0900287int init_nilfs(struct the_nilfs *nilfs, struct super_block *sb, char *data);
288int load_nilfs(struct the_nilfs *nilfs, struct super_block *sb);
Ryusuke Konishi4e33f9e2011-05-05 01:23:58 +0900289unsigned long nilfs_nrsvsegs(struct the_nilfs *nilfs, unsigned long nsegs);
290void nilfs_set_nsegments(struct the_nilfs *nilfs, unsigned long nsegs);
Jiro SEKIBAe902ec92010-01-30 18:06:35 +0900291int nilfs_discard_segments(struct the_nilfs *, __u64 *, size_t);
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700292int nilfs_count_free_blocks(struct the_nilfs *, sector_t *);
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900293struct nilfs_root *nilfs_lookup_root(struct the_nilfs *nilfs, __u64 cno);
294struct nilfs_root *nilfs_find_or_create_root(struct the_nilfs *nilfs,
295 __u64 cno);
296void nilfs_put_root(struct nilfs_root *root);
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700297int nilfs_near_disk_full(struct the_nilfs *);
Ryusuke Konishie339ad32009-04-06 19:01:59 -0700298void nilfs_fall_back_super_block(struct the_nilfs *);
299void nilfs_swap_super_block(struct the_nilfs *);
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700300
301
Ryusuke Konishiba65ae42010-08-14 12:59:15 +0900302static inline void nilfs_get_root(struct nilfs_root *root)
303{
304 atomic_inc(&root->count);
305}
306
Ryusuke Konishia057d2c2009-11-19 19:58:46 +0900307static inline int nilfs_valid_fs(struct the_nilfs *nilfs)
308{
Ryusuke Konishi0c6c44c2016-05-23 16:23:39 -0700309 unsigned int valid_fs;
Ryusuke Konishia057d2c2009-11-19 19:58:46 +0900310
311 down_read(&nilfs->ns_sem);
312 valid_fs = (nilfs->ns_mount_state & NILFS_VALID_FS);
313 up_read(&nilfs->ns_sem);
314 return valid_fs;
315}
316
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700317static inline void
318nilfs_get_segment_range(struct the_nilfs *nilfs, __u64 segnum,
319 sector_t *seg_start, sector_t *seg_end)
320{
321 *seg_start = (sector_t)nilfs->ns_blocks_per_segment * segnum;
322 *seg_end = *seg_start + nilfs->ns_blocks_per_segment - 1;
323 if (segnum == 0)
324 *seg_start = nilfs->ns_first_data_block;
325}
326
327static inline sector_t
328nilfs_get_segment_start_blocknr(struct the_nilfs *nilfs, __u64 segnum)
329{
330 return (segnum == 0) ? nilfs->ns_first_data_block :
331 (sector_t)nilfs->ns_blocks_per_segment * segnum;
332}
333
334static inline __u64
335nilfs_get_segnum_of_block(struct the_nilfs *nilfs, sector_t blocknr)
336{
337 sector_t segnum = blocknr;
338
339 sector_div(segnum, nilfs->ns_blocks_per_segment);
340 return segnum;
341}
342
343static inline void
344nilfs_terminate_segment(struct the_nilfs *nilfs, sector_t seg_start,
345 sector_t seg_end)
346{
347 /* terminate the current full segment (used in case of I/O-error) */
348 nilfs->ns_pseg_offset = seg_end - seg_start + 1;
349}
350
351static inline void nilfs_shift_to_next_segment(struct the_nilfs *nilfs)
352{
353 /* move forward with a full segment */
354 nilfs->ns_segnum = nilfs->ns_nextnum;
355 nilfs->ns_pseg_offset = 0;
356 nilfs->ns_seg_seq++;
357}
358
359static inline __u64 nilfs_last_cno(struct the_nilfs *nilfs)
360{
361 __u64 cno;
362
363 spin_lock(&nilfs->ns_last_segment_lock);
364 cno = nilfs->ns_last_cno;
365 spin_unlock(&nilfs->ns_last_segment_lock);
366 return cno;
367}
368
Ryusuke Konishicece5522009-04-06 19:01:58 -0700369static inline int nilfs_segment_is_active(struct the_nilfs *nilfs, __u64 n)
370{
371 return n == nilfs->ns_segnum || n == nilfs->ns_nextnum;
372}
373
Andreas Rohnere2c76172014-10-13 15:53:20 -0700374static inline int nilfs_flush_device(struct the_nilfs *nilfs)
375{
376 int err;
377
378 if (!nilfs_test_opt(nilfs, BARRIER) || nilfs->ns_flushed_device)
379 return 0;
380
381 nilfs->ns_flushed_device = 1;
382 /*
383 * the store to ns_flushed_device must not be reordered after
384 * blkdev_issue_flush().
385 */
386 smp_wmb();
387
388 err = blkdev_issue_flush(nilfs->ns_bdev, GFP_KERNEL, NULL);
389 if (err != -EIO)
390 err = 0;
391 return err;
392}
393
Ryusuke Konishi65b46432009-04-06 19:01:23 -0700394#endif /* _THE_NILFS_H */