blob: 8442e353309f5d9eb09e39c21f3f7ddc31cc8c3f [file] [log] [blame]
/*
 * Copyright (C) 2005, 2006
 * Avishay Traeger (avishay@gmail.com)
 * Copyright (C) 2008, 2009
 * Boaz Harrosh <bharrosh@panasas.com>
 *
 * Copyrights for code taken from ext2:
 * Copyright (C) 1992, 1993, 1994, 1995
 * Remy Card (card@masi.ibp.fr)
 * Laboratoire MASI - Institut Blaise Pascal
 * Universite Pierre et Marie Curie (Paris VI)
 * from
 * linux/fs/minix/inode.c
 * Copyright (C) 1991, 1992 Linus Torvalds
 *
 * This file is part of exofs.
 *
 * exofs is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation. Since it is based on ext2, and the only
 * valid version of GPL for the Linux kernel is version 2, the only valid
 * version of GPL for exofs is version 2.
 *
 * exofs is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with exofs; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
 */
Boaz Harrosh06886a52009-11-08 14:54:08 +020033#ifndef __EXOFS_H__
34#define __EXOFS_H__
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020035
36#include <linux/fs.h>
37#include <linux/time.h>
38#include "common.h"
39
Boaz Harrosh04dc1e82009-11-16 16:03:05 +020040/* FIXME: Remove once pnfs hits mainline
41 * #include <linux/exportfs/pnfs_osd_xdr.h>
42 */
43#include "pnfs.h"
44
/* Error message: printk at KERN_ERR level, prefixed with "exofs: ". */
#define EXOFS_ERR(fmt, a...) printk(KERN_ERR "exofs: " fmt, ##a)

/*
 * Debug message.
 * With CONFIG_EXOFS_DEBUG defined it is a printk at KERN_NOTICE level,
 * prefixed with the calling function name and line number.
 * Otherwise the printk is placed behind "if (0)": the call is still
 * compiled but the branch is never taken.
 */
#ifdef CONFIG_EXOFS_DEBUG
#define EXOFS_DBGMSG(fmt, a...) \
	printk(KERN_NOTICE "exofs @%s:%d: " fmt, __func__, __LINE__, ##a)
#else
#define EXOFS_DBGMSG(fmt, a...) \
	do { if (0) printk(fmt, ##a); } while (0)
#endif
54
/*
 * u64 has problems with printk; this casts the value to unsigned long long
 * so it can be passed for a %llu-style conversion.
 * The whole expansion is parenthesized so that it remains a single operand
 * wherever it is used (for example as the operand of sizeof).
 */
#define _LLU(x) ((unsigned long long)(x))
57
Boaz Harrosh45d3abc2010-01-28 11:46:16 +020058struct exofs_layout {
59 osd_id s_pid; /* partition ID of file system*/
60
Boaz Harrosh5d952b82010-02-01 13:35:51 +020061 /* Our way of looking at the data_map */
62 unsigned stripe_unit;
63 unsigned mirrors_p1;
64
65 unsigned group_width;
Boaz Harrosh50a76fd2010-02-11 13:01:39 +020066 u64 group_depth;
67 unsigned group_count;
Boaz Harrosh5d952b82010-02-01 13:35:51 +020068
69 enum exofs_inode_layout_gen_functions lay_func;
70
Boaz Harrosh45d3abc2010-01-28 11:46:16 +020071 unsigned s_numdevs; /* Num of devices in array */
72 struct osd_dev *s_ods[0]; /* Variable length */
73};
74
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020075/*
76 * our extension to the in-memory superblock
77 */
78struct exofs_sb_info {
Boaz Harrosh06886a52009-11-08 14:54:08 +020079 struct exofs_fscb s_fscb; /* Written often, pre-allocate*/
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020080 int s_timeout; /* timeout for OSD operations */
81 uint64_t s_nextid; /* highest object ID used */
82 uint32_t s_numfiles; /* number of files on fs */
83 spinlock_t s_next_gen_lock; /* spinlock for gen # update */
84 u32 s_next_generation; /* next gen # to use */
85 atomic_t s_curr_pending; /* number of pending commands */
Boaz Harrosh04dc1e82009-11-16 16:03:05 +020086 uint8_t s_cred[OSD_CAP_LEN]; /* credential for the fscb */
87
Boaz Harrosh45d3abc2010-01-28 11:46:16 +020088 struct pnfs_osd_data_map data_map; /* Default raid to use
89 * FIXME: Needed ?
90 */
91/* struct exofs_layout dir_layout;*/ /* Default dir layout */
92 struct exofs_layout layout; /* Default files layout,
93 * contains the variable osd_dev
94 * array. Keep last */
95 struct osd_dev *_min_one_dev[1]; /* Place holder for one dev */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020096};
97
98/*
99 * our extension to the in-memory inode
100 */
101struct exofs_i_info {
Boaz Harrosh518f1672010-01-21 20:00:02 +0200102 struct inode vfs_inode; /* normal in-memory inode */
103 wait_queue_head_t i_wq; /* wait queue for inode */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200104 unsigned long i_flags; /* various atomic flags */
105 uint32_t i_data[EXOFS_IDATA];/*short symlink names and device #s*/
106 uint32_t i_dir_start_lookup; /* which page to start lookup */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200107 uint64_t i_commit_size; /* the object's written length */
108 uint8_t i_cred[OSD_CAP_LEN];/* all-powerful credential */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200109};
110
Boaz Harrosh06886a52009-11-08 14:54:08 +0200111static inline osd_id exofs_oi_objno(struct exofs_i_info *oi)
112{
113 return oi->vfs_inode.i_ino + EXOFS_OBJ_OFF;
114}
115
116struct exofs_io_state;
117typedef void (*exofs_io_done_fn)(struct exofs_io_state *or, void *private);
118
119struct exofs_io_state {
120 struct kref kref;
121
122 void *private;
123 exofs_io_done_fn done;
124
Boaz Harrosh45d3abc2010-01-28 11:46:16 +0200125 struct exofs_layout *layout;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200126 struct osd_obj_id obj;
127 u8 *cred;
128
129 /* Global read/write IO*/
130 loff_t offset;
131 unsigned long length;
132 void *kern_buff;
Boaz Harrosh86093aa2010-01-28 18:24:06 +0200133
134 struct page **pages;
135 unsigned nr_pages;
136 unsigned pgbase;
Boaz Harrosh50a76fd2010-02-11 13:01:39 +0200137 unsigned pages_consumed;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200138
139 /* Attributes */
140 unsigned in_attr_len;
141 struct osd_attr *in_attr;
142 unsigned out_attr_len;
143 struct osd_attr *out_attr;
144
145 /* Variable array of size numdevs */
146 unsigned numdevs;
147 struct exofs_per_dev_state {
148 struct osd_request *or;
149 struct bio *bio;
Boaz Harrosh5d952b82010-02-01 13:35:51 +0200150 loff_t offset;
151 unsigned length;
152 unsigned dev;
Boaz Harrosh06886a52009-11-08 14:54:08 +0200153 } per_dev[];
154};
155
156static inline unsigned exofs_io_state_size(unsigned numdevs)
157{
158 return sizeof(struct exofs_io_state) +
159 sizeof(struct exofs_per_dev_state) * numdevs;
160}
161
/*
 * our inode flags
 *
 * These are bit numbers within exofs_i_info.i_flags, used with
 * test_bit()/set_bit() by the accessors that follow.
 */
#define OBJ_2BCREATED	0	/* object will be created soon*/
#define OBJ_CREATED	1	/* object has been created on the osd*/
167
168static inline int obj_2bcreated(struct exofs_i_info *oi)
169{
170 return test_bit(OBJ_2BCREATED, &oi->i_flags);
171}
172
173static inline void set_obj_2bcreated(struct exofs_i_info *oi)
174{
175 set_bit(OBJ_2BCREATED, &oi->i_flags);
176}
177
178static inline int obj_created(struct exofs_i_info *oi)
179{
180 return test_bit(OBJ_CREATED, &oi->i_flags);
181}
182
183static inline void set_obj_created(struct exofs_i_info *oi)
184{
185 set_bit(OBJ_CREATED, &oi->i_flags);
186}
187
int __exofs_wait_obj_created(struct exofs_i_info *oi);

/*
 * Returns 0 immediately when OBJ_CREATED is already set (the expected case);
 * otherwise returns the result of __exofs_wait_obj_created().
 */
static inline int wait_obj_created(struct exofs_i_info *oi)
{
	if (likely(obj_created(oi)))
		return 0;

	return __exofs_wait_obj_created(oi);
}
196
197/*
198 * get to our inode from the vfs inode
199 */
200static inline struct exofs_i_info *exofs_i(struct inode *inode)
201{
202 return container_of(inode, struct exofs_i_info, vfs_inode);
203}
204
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200205/*
Boaz Harroshd9c740d2010-01-28 11:58:08 +0200206 * Given a layout, object_number and stripe_index return the associated global
207 * dev_index
208 */
209unsigned exofs_layout_od_id(struct exofs_layout *layout,
210 osd_id obj_no, unsigned layout_index);
/*
 * Maximum count of links to a file
 */
#define EXOFS_LINK_MAX           32000
215
Boaz Harroshe8062712008-10-27 18:37:02 +0200216/*************************
217 * function declarations *
218 *************************/
Boaz Harrosh06886a52009-11-08 14:54:08 +0200219
220/* ios.c */
221void exofs_make_credential(u8 cred_a[OSD_CAP_LEN],
222 const struct osd_obj_id *obj);
223int exofs_read_kern(struct osd_dev *od, u8 *cred, struct osd_obj_id *obj,
224 u64 offset, void *p, unsigned length);
225
Boaz Harrosh45d3abc2010-01-28 11:46:16 +0200226int exofs_get_io_state(struct exofs_layout *layout,
227 struct exofs_io_state **ios);
Boaz Harrosh06886a52009-11-08 14:54:08 +0200228void exofs_put_io_state(struct exofs_io_state *ios);
229
230int exofs_check_io(struct exofs_io_state *ios, u64 *resid);
231
232int exofs_sbi_create(struct exofs_io_state *ios);
233int exofs_sbi_remove(struct exofs_io_state *ios);
234int exofs_sbi_write(struct exofs_io_state *ios);
235int exofs_sbi_read(struct exofs_io_state *ios);
236
237int extract_attr_from_ios(struct exofs_io_state *ios, struct osd_attr *attr);
238
239int exofs_oi_truncate(struct exofs_i_info *oi, u64 new_len);
240static inline int exofs_oi_write(struct exofs_i_info *oi,
241 struct exofs_io_state *ios)
242{
243 ios->obj.id = exofs_oi_objno(oi);
244 ios->cred = oi->i_cred;
245 return exofs_sbi_write(ios);
246}
247
248static inline int exofs_oi_read(struct exofs_i_info *oi,
249 struct exofs_io_state *ios)
250{
251 ios->obj.id = exofs_oi_objno(oi);
252 ios->cred = oi->i_cred;
253 return exofs_sbi_read(ios);
254}
255
Boaz Harroshe8062712008-10-27 18:37:02 +0200256/* inode.c */
257void exofs_truncate(struct inode *inode);
258int exofs_setattr(struct dentry *, struct iattr *);
Boaz Harroshbeaec072008-10-27 19:31:34 +0200259int exofs_write_begin(struct file *file, struct address_space *mapping,
260 loff_t pos, unsigned len, unsigned flags,
261 struct page **pagep, void **fsdata);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200262extern struct inode *exofs_iget(struct super_block *, unsigned long);
263struct inode *exofs_new_inode(struct inode *, int);
Christoph Hellwiga9185b42010-03-05 09:21:37 +0100264extern int exofs_write_inode(struct inode *, struct writeback_control *wbc);
Boaz Harroshba9e5e92008-10-28 16:11:41 +0200265extern void exofs_delete_inode(struct inode *);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200266
267/* dir.c: */
268int exofs_add_link(struct dentry *, struct inode *);
269ino_t exofs_inode_by_name(struct inode *, struct dentry *);
270int exofs_delete_entry(struct exofs_dir_entry *, struct page *);
271int exofs_make_empty(struct inode *, struct inode *);
272struct exofs_dir_entry *exofs_find_entry(struct inode *, struct dentry *,
273 struct page **);
274int exofs_empty_dir(struct inode *);
275struct exofs_dir_entry *exofs_dotdot(struct inode *, struct page **);
Boaz Harrosh8cf74b32009-03-22 12:47:26 +0200276ino_t exofs_parent_ino(struct dentry *child);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200277int exofs_set_link(struct inode *, struct exofs_dir_entry *, struct page *,
278 struct inode *);
Boaz Harroshe8062712008-10-27 18:37:02 +0200279
/* super.c               */
int exofs_sync_fs(struct super_block *sb, int wait);
282
/*********************
 * operation vectors *
 *********************/
/* dir.c:            */
extern const struct file_operations exofs_dir_operations;

/* file.c            */
extern const struct inode_operations exofs_file_inode_operations;
extern const struct file_operations exofs_file_operations;

/* inode.c           */
extern const struct address_space_operations exofs_aops;
extern const struct osd_attr g_attr_logical_length;

/* namei.c           */
extern const struct inode_operations exofs_dir_inode_operations;
extern const struct inode_operations exofs_special_inode_operations;

/* symlink.c         */
extern const struct inode_operations exofs_symlink_inode_operations;
extern const struct inode_operations exofs_fast_symlink_inode_operations;
304
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200305#endif