/*
 * Copyright (C) 2005, 2006
 * Avishay Traeger (avishay@gmail.com)
 * Copyright (C) 2008, 2009
 * Boaz Harrosh <bharrosh@panasas.com>
 *
 * Copyrights for code taken from ext2:
 * Copyright (C) 1992, 1993, 1994, 1995
 * Remy Card (card@masi.ibp.fr)
 * Laboratoire MASI - Institut Blaise Pascal
 * Universite Pierre et Marie Curie (Paris VI)
 * from
 * linux/fs/minix/inode.c
 * Copyright (C) 1991, 1992 Linus Torvalds
 *
 * This file is part of exofs.
 *
 * exofs is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation. Since it is based on ext2, and the only
 * valid version of GPL for the Linux kernel is version 2, the only valid
 * version of GPL for exofs is version 2.
 *
 * exofs is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with exofs; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
 */
Boaz Harrosh06886a52009-11-08 14:54:08 +020033#ifndef __EXOFS_H__
34#define __EXOFS_H__
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020035
36#include <linux/fs.h>
37#include <linux/time.h>
Jens Axboeb3d0ab72010-04-22 12:26:04 +020038#include <linux/backing-dev.h>
Boaz Harrosh26ae93c2010-02-02 15:56:53 +020039#include <linux/pnfs_osd_xdr.h>
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020040#include "common.h"
41
/* Emit a KERN_ERR message to the kernel log, prefixed with "exofs: ". */
#define EXOFS_ERR(fmt, ...) printk(KERN_ERR "exofs: " fmt, ##__VA_ARGS__)
43
/*
 * Debug trace macro.
 *
 * Without CONFIG_EXOFS_DEBUG the printk() sits behind "if (0)": nothing is
 * emitted, but the call is still compiled, so the format and its arguments
 * stay syntax- and type-checked.
 * With CONFIG_EXOFS_DEBUG the message is printed at KERN_NOTICE and tagged
 * with the calling function name and line number.
 */
#ifndef CONFIG_EXOFS_DEBUG
#define EXOFS_DBGMSG(fmt, ...) \
	do { if (0) printk(fmt, ##__VA_ARGS__); } while (0)
#else
#define EXOFS_DBGMSG(fmt, ...) \
	printk(KERN_NOTICE "exofs @%s:%d: " fmt, __func__, __LINE__, \
	       ##__VA_ARGS__)
#endif
51
/*
 * u64 has problems with printk; _LLU() casts its argument to
 * unsigned long long so it can be printed with "%llu" / "%llx".
 *
 * The whole expansion is parenthesized so the macro behaves as a single
 * primary expression wherever it is used (e.g. after sizeof or another
 * unary operator).
 */
#define _LLU(x) ((unsigned long long)(x))
54
Boaz Harrosh9e9db452011-08-05 15:06:04 -070055struct exofs_comp {
56 struct osd_obj_id obj;
57 u8 cred[OSD_CAP_LEN];
58};
Boaz Harrosh45d3abc2010-01-28 11:46:16 +020059
Boaz Harrosh9e9db452011-08-05 15:06:04 -070060struct exofs_layout {
Boaz Harrosh5d952b82010-02-01 13:35:51 +020061 /* Our way of looking at the data_map */
62 unsigned stripe_unit;
63 unsigned mirrors_p1;
64
65 unsigned group_width;
Boaz Harrosh50a76fd2010-02-11 13:01:39 +020066 u64 group_depth;
67 unsigned group_count;
Boaz Harrosh9e9db452011-08-05 15:06:04 -070068};
Boaz Harrosh5d952b82010-02-01 13:35:51 +020069
/*
 * A view of the device array together with the component(s) to use on it.
 */
struct exofs_components {
	unsigned int		numdevs;	/* Num of devices in array */

	/*
	 * When @single_comp == EC_SINGLE_COMP, @comps points to a single
	 * component; otherwise there are @numdevs components.
	 */
	enum EC_COMP_USAGE {
		EC_SINGLE_COMP = 0,
		EC_MULTPLE_COMPS = 0xffffffff
	} single_comp;
	struct exofs_comp	*comps;
	struct osd_dev		**ods;		/* osd_dev array */
};
81
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020082/*
83 * our extension to the in-memory superblock
84 */
85struct exofs_sb_info {
Boaz Harrosh6d4073e2011-07-27 17:51:53 -070086 struct backing_dev_info bdi; /* register our bdi with VFS */
Boaz Harrosh1cea3122011-02-03 17:53:25 +020087 struct exofs_sb_stats s_ess; /* Written often, pre-allocate*/
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020088 int s_timeout; /* timeout for OSD operations */
89 uint64_t s_nextid; /* highest object ID used */
90 uint32_t s_numfiles; /* number of files on fs */
91 spinlock_t s_next_gen_lock; /* spinlock for gen # update */
92 u32 s_next_generation; /* next gen # to use */
93 atomic_t s_curr_pending; /* number of pending commands */
Boaz Harrosh04dc1e82009-11-16 16:03:05 +020094
Boaz Harrosh45d3abc2010-01-28 11:46:16 +020095 struct pnfs_osd_data_map data_map; /* Default raid to use
96 * FIXME: Needed ?
97 */
Boaz Harrosh6d4073e2011-07-27 17:51:53 -070098 struct exofs_layout layout; /* Default files layout */
Boaz Harrosh9e9db452011-08-05 15:06:04 -070099 struct exofs_comp one_comp; /* id & cred of partition id=0*/
100 struct exofs_components comps; /* comps for the partition */
Boaz Harrosh45d3abc2010-01-28 11:46:16 +0200101 struct osd_dev *_min_one_dev[1]; /* Place holder for one dev */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200102};
103
104/*
105 * our extension to the in-memory inode
106 */
107struct exofs_i_info {
Boaz Harrosh518f1672010-01-21 20:00:02 +0200108 struct inode vfs_inode; /* normal in-memory inode */
109 wait_queue_head_t i_wq; /* wait queue for inode */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200110 unsigned long i_flags; /* various atomic flags */
111 uint32_t i_data[EXOFS_IDATA];/*short symlink names and device #s*/
112 uint32_t i_dir_start_lookup; /* which page to start lookup */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200113 uint64_t i_commit_size; /* the object's written length */
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700114 struct exofs_comp one_comp; /* same component for all devices */
115 struct exofs_components comps; /* inode view of the device table */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200116};
117
Boaz Harrosh06886a52009-11-08 14:54:08 +0200118static inline osd_id exofs_oi_objno(struct exofs_i_info *oi)
119{
120 return oi->vfs_inode.i_ino + EXOFS_OBJ_OFF;
121}
122
123struct exofs_io_state;
Boaz Harroshe1042ba2010-11-16 20:09:58 +0200124typedef void (*exofs_io_done_fn)(struct exofs_io_state *ios, void *private);
Boaz Harrosh06886a52009-11-08 14:54:08 +0200125
126struct exofs_io_state {
127 struct kref kref;
128
129 void *private;
130 exofs_io_done_fn done;
131
Boaz Harrosh45d3abc2010-01-28 11:46:16 +0200132 struct exofs_layout *layout;
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700133 struct exofs_components *comps;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200134
135 /* Global read/write IO*/
136 loff_t offset;
137 unsigned long length;
138 void *kern_buff;
Boaz Harrosh86093aa2010-01-28 18:24:06 +0200139
140 struct page **pages;
141 unsigned nr_pages;
142 unsigned pgbase;
Boaz Harrosh50a76fd2010-02-11 13:01:39 +0200143 unsigned pages_consumed;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200144
145 /* Attributes */
146 unsigned in_attr_len;
147 struct osd_attr *in_attr;
148 unsigned out_attr_len;
149 struct osd_attr *out_attr;
150
Boaz Harroshe1042ba2010-11-16 20:09:58 +0200151 bool reading;
152
Boaz Harrosh06886a52009-11-08 14:54:08 +0200153 /* Variable array of size numdevs */
154 unsigned numdevs;
155 struct exofs_per_dev_state {
156 struct osd_request *or;
157 struct bio *bio;
Boaz Harrosh5d952b82010-02-01 13:35:51 +0200158 loff_t offset;
159 unsigned length;
160 unsigned dev;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200161 } per_dev[];
162};
163
164static inline unsigned exofs_io_state_size(unsigned numdevs)
165{
166 return sizeof(struct exofs_io_state) +
167 sizeof(struct exofs_per_dev_state) * numdevs;
168}
169
/*
 * Inode flags: bit numbers within exofs_i_info::i_flags, used with
 * test_bit()/set_bit() by the accessors in this header.
 */
#define OBJ_2BCREATED	0	/* object will be created soon */
#define OBJ_CREATED	1	/* object has been created on the osd */
175
176static inline int obj_2bcreated(struct exofs_i_info *oi)
177{
178 return test_bit(OBJ_2BCREATED, &oi->i_flags);
179}
180
181static inline void set_obj_2bcreated(struct exofs_i_info *oi)
182{
183 set_bit(OBJ_2BCREATED, &oi->i_flags);
184}
185
186static inline int obj_created(struct exofs_i_info *oi)
187{
188 return test_bit(OBJ_CREATED, &oi->i_flags);
189}
190
191static inline void set_obj_created(struct exofs_i_info *oi)
192{
193 set_bit(OBJ_CREATED, &oi->i_flags);
194}
195
/* Slow path of wait_obj_created(); defined outside this header. */
int __exofs_wait_obj_created(struct exofs_i_info *oi);

/*
 * Fast-path wrapper: returns 0 immediately when the OBJ_CREATED flag is
 * already set, otherwise returns whatever __exofs_wait_obj_created() returns.
 */
static inline int wait_obj_created(struct exofs_i_info *oi)
{
	if (unlikely(!obj_created(oi)))
		return __exofs_wait_obj_created(oi);

	return 0;
}
204
205/*
206 * get to our inode from the vfs inode
207 */
208static inline struct exofs_i_info *exofs_i(struct inode *inode)
209{
210 return container_of(inode, struct exofs_i_info, vfs_inode);
211}
212
/* Upper bound on the number of links to a single file. */
#define EXOFS_LINK_MAX		32000
217
Boaz Harroshe8062712008-10-27 18:37:02 +0200218/*************************
219 * function declarations *
220 *************************/
Boaz Harrosh06886a52009-11-08 14:54:08 +0200221
222/* ios.c */
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700223int exofs_get_rw_state(struct exofs_layout *layout,
224 struct exofs_components *comps,
225 bool is_reading, u64 offset, u64 length,
226 struct exofs_io_state **ios);
227int exofs_get_io_state(struct exofs_layout *layout,
228 struct exofs_components *comps,
229 struct exofs_io_state **ios);
Boaz Harrosh06886a52009-11-08 14:54:08 +0200230void exofs_put_io_state(struct exofs_io_state *ios);
231
232int exofs_check_io(struct exofs_io_state *ios, u64 *resid);
233
234int exofs_sbi_create(struct exofs_io_state *ios);
235int exofs_sbi_remove(struct exofs_io_state *ios);
236int exofs_sbi_write(struct exofs_io_state *ios);
237int exofs_sbi_read(struct exofs_io_state *ios);
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700238int exofs_truncate(struct exofs_layout *layout, struct exofs_components *comps,
239 u64 size);
Boaz Harrosh06886a52009-11-08 14:54:08 +0200240
241int extract_attr_from_ios(struct exofs_io_state *ios, struct osd_attr *attr);
Boaz Harrosh85e44df2011-05-16 15:26:47 +0300242extern const struct osd_attr g_attr_logical_length;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200243
Boaz Harroshe8062712008-10-27 18:37:02 +0200244/* inode.c */
bharrosh@panasas.com66cd6ca2010-10-07 14:28:18 -0400245unsigned exofs_max_io_pages(struct exofs_layout *layout,
246 unsigned expected_pages);
Boaz Harroshe8062712008-10-27 18:37:02 +0200247int exofs_setattr(struct dentry *, struct iattr *);
Boaz Harroshbeaec072008-10-27 19:31:34 +0200248int exofs_write_begin(struct file *file, struct address_space *mapping,
249 loff_t pos, unsigned len, unsigned flags,
250 struct page **pagep, void **fsdata);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200251extern struct inode *exofs_iget(struct super_block *, unsigned long);
252struct inode *exofs_new_inode(struct inode *, int);
Christoph Hellwiga9185b42010-03-05 09:21:37 +0100253extern int exofs_write_inode(struct inode *, struct writeback_control *wbc);
Al Viro4ec70c92010-06-07 11:42:26 -0400254extern void exofs_evict_inode(struct inode *);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200255
256/* dir.c: */
257int exofs_add_link(struct dentry *, struct inode *);
258ino_t exofs_inode_by_name(struct inode *, struct dentry *);
259int exofs_delete_entry(struct exofs_dir_entry *, struct page *);
260int exofs_make_empty(struct inode *, struct inode *);
261struct exofs_dir_entry *exofs_find_entry(struct inode *, struct dentry *,
262 struct page **);
263int exofs_empty_dir(struct inode *);
264struct exofs_dir_entry *exofs_dotdot(struct inode *, struct page **);
Boaz Harrosh8cf74b32009-03-22 12:47:26 +0200265ino_t exofs_parent_ino(struct dentry *child);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200266int exofs_set_link(struct inode *, struct exofs_dir_entry *, struct page *,
267 struct inode *);
Boaz Harroshe8062712008-10-27 18:37:02 +0200268
Boaz Harroshbaaf94c2009-06-14 16:52:10 +0300269/* super.c */
Boaz Harrosh85e44df2011-05-16 15:26:47 +0300270void exofs_make_credential(u8 cred_a[OSD_CAP_LEN],
271 const struct osd_obj_id *obj);
Boaz Harrosh1cea3122011-02-03 17:53:25 +0200272int exofs_sbi_write_stats(struct exofs_sb_info *sbi);
Boaz Harroshbaaf94c2009-06-14 16:52:10 +0300273
/*********************
 * operation vectors *
 *********************/

/* dir.c: */
extern const struct file_operations exofs_dir_operations;

/* file.c */
extern const struct inode_operations exofs_file_inode_operations;
extern const struct file_operations exofs_file_operations;

/* inode.c */
extern const struct address_space_operations exofs_aops;

/* namei.c */
extern const struct inode_operations exofs_dir_inode_operations;
extern const struct inode_operations exofs_special_inode_operations;

/* symlink.c */
extern const struct inode_operations exofs_symlink_inode_operations;
extern const struct inode_operations exofs_fast_symlink_inode_operations;
294
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700295/* exofs_init_comps will initialize an exofs_components device array
296 * pointing to a single exofs_comp struct, and a round-robin view
297 * of the device table.
298 * The first device of each inode is the [inode->ino % num_devices]
299 * and the rest of the devices sequentially following where the
300 * first device is after the last device.
301 * It is assumed that the global device array at @sbi is twice
302 * bigger and that the device table repeats twice.
303 * See: exofs_read_lookup_dev_table()
304 */
305static inline void exofs_init_comps(struct exofs_components *comps,
306 struct exofs_comp *one_comp,
307 struct exofs_sb_info *sbi, osd_id oid)
308{
309 unsigned dev_mod = (unsigned)oid, first_dev;
310
311 one_comp->obj.partition = sbi->one_comp.obj.partition;
312 one_comp->obj.id = oid;
313 exofs_make_credential(one_comp->cred, &one_comp->obj);
314
315 comps->numdevs = sbi->comps.numdevs;
316 comps->single_comp = EC_SINGLE_COMP;
317 comps->comps = one_comp;
318
319 /* Round robin device view of the table */
320 first_dev = (dev_mod * sbi->layout.mirrors_p1) % sbi->comps.numdevs;
321 comps->ods = sbi->comps.ods + first_dev;
322}
323
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200324#endif