blob: fffe86fd7a4260cc3bce3b6910f930ee7f32f5d6 [file] [log] [blame]
/*
 * Copyright (C) 2005, 2006
 * Avishay Traeger (avishay@gmail.com)
 * Copyright (C) 2008, 2009
 * Boaz Harrosh <bharrosh@panasas.com>
 *
 * Copyrights for code taken from ext2:
 * Copyright (C) 1992, 1993, 1994, 1995
 * Remy Card (card@masi.ibp.fr)
 * Laboratoire MASI - Institut Blaise Pascal
 * Universite Pierre et Marie Curie (Paris VI)
 * from
 * linux/fs/minix/inode.c
 * Copyright (C) 1991, 1992 Linus Torvalds
 *
 * This file is part of exofs.
 *
 * exofs is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation. Since it is based on ext2, and the only
 * valid version of GPL for the Linux kernel is version 2, the only valid
 * version of GPL for exofs is version 2.
 *
 * exofs is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with exofs; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
 */
Boaz Harrosh06886a52009-11-08 14:54:08 +020033#ifndef __EXOFS_H__
34#define __EXOFS_H__
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020035
36#include <linux/fs.h>
37#include <linux/time.h>
Jens Axboeb3d0ab72010-04-22 12:26:04 +020038#include <linux/backing-dev.h>
Boaz Harrosh8ff660a2011-08-06 19:26:31 -070039#include <scsi/osd_ore.h>
40
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020041#include "common.h"
42
/* Emit an error-level printk message prefixed with "exofs: ". */
#define EXOFS_ERR(fmt, a...) printk(KERN_ERR "exofs: " fmt, ##a)

/*
 * Debug trace. With CONFIG_EXOFS_DEBUG defined the message is printed at
 * KERN_NOTICE, tagged with the calling function name and line number.
 * Without it the printk sits under "if (0)": the arguments are still seen
 * by the compiler but the call is never executed.
 */
#ifdef CONFIG_EXOFS_DEBUG
#define EXOFS_DBGMSG(fmt, a...) \
	printk(KERN_NOTICE "exofs @%s:%d: " fmt, __func__, __LINE__, ##a)
#else
#define EXOFS_DBGMSG(fmt, a...) \
	do { if (0) printk(fmt, ##a); } while (0)
#endif

/*
 * u64 has problems with printk; this casts it to unsigned long long.
 * The whole expansion is parenthesised so the macro behaves as a single
 * primary expression (e.g. under sizeof or before a postfix operator).
 */
#define _LLU(x) ((unsigned long long)(x))

Boaz Harroshd866d872011-09-28 14:43:09 +030056struct exofs_dev {
57 struct ore_dev ored;
58 unsigned did;
Sachin Bhamare8b56a302012-03-14 18:01:45 -070059 unsigned urilen;
60 uint8_t *uri;
61 struct kobject ed_kobj;
Boaz Harroshd866d872011-09-28 14:43:09 +030062};
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020063/*
64 * our extension to the in-memory superblock
65 */
66struct exofs_sb_info {
Boaz Harrosh6d4073e2011-07-27 17:51:53 -070067 struct backing_dev_info bdi; /* register our bdi with VFS */
Boaz Harrosh1cea3122011-02-03 17:53:25 +020068 struct exofs_sb_stats s_ess; /* Written often, pre-allocate*/
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020069 int s_timeout; /* timeout for OSD operations */
70 uint64_t s_nextid; /* highest object ID used */
71 uint32_t s_numfiles; /* number of files on fs */
72 spinlock_t s_next_gen_lock; /* spinlock for gen # update */
73 u32 s_next_generation; /* next gen # to use */
74 atomic_t s_curr_pending; /* number of pending commands */
Boaz Harrosh04dc1e82009-11-16 16:03:05 +020075
Boaz Harrosh8ff660a2011-08-06 19:26:31 -070076 struct ore_layout layout; /* Default files layout */
77 struct ore_comp one_comp; /* id & cred of partition id=0*/
Boaz Harrosh5bf696d2011-09-28 11:39:59 +030078 struct ore_components oc; /* comps for the partition */
Sachin Bhamare8b56a302012-03-14 18:01:45 -070079 struct kobject s_kobj; /* holds per-sbi kobject */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020080};
81
82/*
83 * our extension to the in-memory inode
84 */
85struct exofs_i_info {
Boaz Harrosh518f1672010-01-21 20:00:02 +020086 struct inode vfs_inode; /* normal in-memory inode */
87 wait_queue_head_t i_wq; /* wait queue for inode */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020088 unsigned long i_flags; /* various atomic flags */
89 uint32_t i_data[EXOFS_IDATA];/*short symlink names and device #s*/
90 uint32_t i_dir_start_lookup; /* which page to start lookup */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020091 uint64_t i_commit_size; /* the object's written length */
Boaz Harrosh8ff660a2011-08-06 19:26:31 -070092 struct ore_comp one_comp; /* same component for all devices */
Boaz Harrosh5bf696d2011-09-28 11:39:59 +030093 struct ore_components oc; /* inode view of the device table */
Boaz Harroshb14f8ab2008-10-27 18:27:55 +020094};
95
Boaz Harrosh06886a52009-11-08 14:54:08 +020096static inline osd_id exofs_oi_objno(struct exofs_i_info *oi)
97{
98 return oi->vfs_inode.i_ino + EXOFS_OBJ_OFF;
99}
100
/*
 * our inode flags
 * (bit numbers inside exofs_i_info.i_flags, accessed via test_bit/set_bit)
 */
#define OBJ_2BCREATED	0	/* object will be created soon*/
#define OBJ_CREATED	1	/* object has been created on the osd*/

107static inline int obj_2bcreated(struct exofs_i_info *oi)
108{
109 return test_bit(OBJ_2BCREATED, &oi->i_flags);
110}
111
112static inline void set_obj_2bcreated(struct exofs_i_info *oi)
113{
114 set_bit(OBJ_2BCREATED, &oi->i_flags);
115}
116
117static inline int obj_created(struct exofs_i_info *oi)
118{
119 return test_bit(OBJ_CREATED, &oi->i_flags);
120}
121
122static inline void set_obj_created(struct exofs_i_info *oi)
123{
124 set_bit(OBJ_CREATED, &oi->i_flags);
125}
126
/*
 * Returns 0 immediately when OBJ_CREATED is already set on @oi (the path
 * marked likely); otherwise defers to __exofs_wait_obj_created() and
 * returns whatever that returns.
 */
int __exofs_wait_obj_created(struct exofs_i_info *oi);
static inline int wait_obj_created(struct exofs_i_info *oi)
{
	if (likely(obj_created(oi)))
		return 0;

	return __exofs_wait_obj_created(oi);
}

136/*
137 * get to our inode from the vfs inode
138 */
139static inline struct exofs_i_info *exofs_i(struct inode *inode)
140{
141 return container_of(inode, struct exofs_i_info, vfs_inode);
142}
143
/*
 * Maximum count of links to a file
 */
#define EXOFS_LINK_MAX           32000

Boaz Harroshe8062712008-10-27 18:37:02 +0200149/*************************
150 * function declarations *
151 *************************/
Boaz Harrosh06886a52009-11-08 14:54:08 +0200152
Boaz Harroshe8062712008-10-27 18:37:02 +0200153/* inode.c */
Boaz Harrosh8ff660a2011-08-06 19:26:31 -0700154unsigned exofs_max_io_pages(struct ore_layout *layout,
bharrosh@panasas.com66cd6ca2010-10-07 14:28:18 -0400155 unsigned expected_pages);
Boaz Harroshe8062712008-10-27 18:37:02 +0200156int exofs_setattr(struct dentry *, struct iattr *);
Boaz Harroshbeaec072008-10-27 19:31:34 +0200157int exofs_write_begin(struct file *file, struct address_space *mapping,
158 loff_t pos, unsigned len, unsigned flags,
159 struct page **pagep, void **fsdata);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200160extern struct inode *exofs_iget(struct super_block *, unsigned long);
Al Virobef41c22011-07-26 03:07:49 -0400161struct inode *exofs_new_inode(struct inode *, umode_t);
Christoph Hellwiga9185b42010-03-05 09:21:37 +0100162extern int exofs_write_inode(struct inode *, struct writeback_control *wbc);
Al Viro4ec70c92010-06-07 11:42:26 -0400163extern void exofs_evict_inode(struct inode *);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200164
165/* dir.c: */
166int exofs_add_link(struct dentry *, struct inode *);
167ino_t exofs_inode_by_name(struct inode *, struct dentry *);
168int exofs_delete_entry(struct exofs_dir_entry *, struct page *);
169int exofs_make_empty(struct inode *, struct inode *);
170struct exofs_dir_entry *exofs_find_entry(struct inode *, struct dentry *,
171 struct page **);
172int exofs_empty_dir(struct inode *);
173struct exofs_dir_entry *exofs_dotdot(struct inode *, struct page **);
Boaz Harrosh8cf74b32009-03-22 12:47:26 +0200174ino_t exofs_parent_ino(struct dentry *child);
Boaz Harroshe6af00f2008-10-28 15:38:12 +0200175int exofs_set_link(struct inode *, struct exofs_dir_entry *, struct page *,
176 struct inode *);
Boaz Harroshe8062712008-10-27 18:37:02 +0200177
Boaz Harroshbaaf94c2009-06-14 16:52:10 +0300178/* super.c */
Boaz Harrosh85e44df2011-05-16 15:26:47 +0300179void exofs_make_credential(u8 cred_a[OSD_CAP_LEN],
180 const struct osd_obj_id *obj);
Boaz Harrosh1cea3122011-02-03 17:53:25 +0200181int exofs_sbi_write_stats(struct exofs_sb_info *sbi);
Boaz Harroshbaaf94c2009-06-14 16:52:10 +0300182
/* sys.c */
int exofs_sysfs_init(void);
void exofs_sysfs_uninit(void);
int exofs_sysfs_sb_add(struct exofs_sb_info *sbi,
		       struct exofs_dt_device_info *dt_dev);
void exofs_sysfs_sb_del(struct exofs_sb_info *sbi);
int exofs_sysfs_odev_add(struct exofs_dev *edev,
			 struct exofs_sb_info *sbi);
void exofs_sysfs_dbg_print(void);

/*********************
 * operation vectors *
 *********************/
/* dir.c: */
extern const struct file_operations exofs_dir_operations;

/* file.c */
extern const struct inode_operations exofs_file_inode_operations;
extern const struct file_operations exofs_file_operations;

/* inode.c */
extern const struct address_space_operations exofs_aops;

/* namei.c */
extern const struct inode_operations exofs_dir_inode_operations;
extern const struct inode_operations exofs_special_inode_operations;

/* symlink.c */
extern const struct inode_operations exofs_symlink_inode_operations;
extern const struct inode_operations exofs_fast_symlink_inode_operations;

Boaz Harrosh8ff660a2011-08-06 19:26:31 -0700214/* exofs_init_comps will initialize an ore_components device array
215 * pointing to a single ore_comp struct, and a round-robin view
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700216 * of the device table.
217 * The first device of each inode is the [inode->ino % num_devices]
218 * and the rest of the devices sequentially following where the
219 * first device is after the last device.
220 * It is assumed that the global device array at @sbi is twice
221 * bigger and that the device table repeats twice.
222 * See: exofs_read_lookup_dev_table()
223 */
Boaz Harrosh5bf696d2011-09-28 11:39:59 +0300224static inline void exofs_init_comps(struct ore_components *oc,
Boaz Harrosh8ff660a2011-08-06 19:26:31 -0700225 struct ore_comp *one_comp,
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700226 struct exofs_sb_info *sbi, osd_id oid)
227{
228 unsigned dev_mod = (unsigned)oid, first_dev;
229
230 one_comp->obj.partition = sbi->one_comp.obj.partition;
231 one_comp->obj.id = oid;
232 exofs_make_credential(one_comp->cred, &one_comp->obj);
233
Boaz Harrosh3bd98562011-09-28 12:04:23 +0300234 oc->first_dev = 0;
Boaz Harroshd866d872011-09-28 14:43:09 +0300235 oc->numdevs = sbi->layout.group_width * sbi->layout.mirrors_p1 *
236 sbi->layout.group_count;
Boaz Harrosh5bf696d2011-09-28 11:39:59 +0300237 oc->single_comp = EC_SINGLE_COMP;
238 oc->comps = one_comp;
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700239
240 /* Round robin device view of the table */
Boaz Harrosh5bf696d2011-09-28 11:39:59 +0300241 first_dev = (dev_mod * sbi->layout.mirrors_p1) % sbi->oc.numdevs;
Boaz Harroshd866d872011-09-28 14:43:09 +0300242 oc->ods = &sbi->oc.ods[first_dev];
Boaz Harrosh9e9db452011-08-05 15:06:04 -0700243}
244
Boaz Harroshb14f8ab2008-10-27 18:27:55 +0200245#endif