Linus Torvalds | 96c57ad | 2014-04-12 15:39:53 -0700 | [diff] [blame] | 1 | #include <linux/ceph/ceph_debug.h> |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 2 | #include <linux/in.h> |
| 3 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 4 | #include "super.h" |
Yehuda Sadeh | 3d14c5d | 2010-04-06 15:14:15 -0700 | [diff] [blame] | 5 | #include "mds_client.h" |
Yehuda Sadeh | 3d14c5d | 2010-04-06 15:14:15 -0700 | [diff] [blame] | 6 | #include "ioctl.h" |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 7 | |
| 8 | |
| 9 | /* |
| 10 | * ioctls |
| 11 | */ |
| 12 | |
| 13 | /* |
| 14 | * get and set the file layout |
| 15 | */ |
| 16 | static long ceph_ioctl_get_layout(struct file *file, void __user *arg) |
| 17 | { |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 18 | struct ceph_inode_info *ci = ceph_inode(file_inode(file)); |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 19 | struct ceph_ioctl_layout l; |
| 20 | int err; |
| 21 | |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 22 | err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT); |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 23 | if (!err) { |
| 24 | l.stripe_unit = ceph_file_layout_su(ci->i_layout); |
| 25 | l.stripe_count = ceph_file_layout_stripe_count(ci->i_layout); |
| 26 | l.object_size = ceph_file_layout_object_size(ci->i_layout); |
| 27 | l.data_pool = le32_to_cpu(ci->i_layout.fl_pg_pool); |
Sage Weil | 3469ac1a | 2012-05-07 15:33:36 -0700 | [diff] [blame] | 28 | l.preferred_osd = (s32)-1; |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 29 | if (copy_to_user(arg, &l, sizeof(l))) |
| 30 | return -EFAULT; |
| 31 | } |
| 32 | |
| 33 | return err; |
| 34 | } |
| 35 | |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 36 | static long __validate_layout(struct ceph_mds_client *mdsc, |
| 37 | struct ceph_ioctl_layout *l) |
| 38 | { |
| 39 | int i, err; |
| 40 | |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 41 | /* validate striping parameters */ |
| 42 | if ((l->object_size & ~PAGE_MASK) || |
| 43 | (l->stripe_unit & ~PAGE_MASK) || |
Sage Weil | 45f2e08 | 2012-08-21 12:11:51 -0700 | [diff] [blame] | 44 | (l->stripe_unit != 0 && |
| 45 | ((unsigned)l->object_size % (unsigned)l->stripe_unit))) |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 46 | return -EINVAL; |
| 47 | |
| 48 | /* make sure it's a valid data pool */ |
| 49 | mutex_lock(&mdsc->mutex); |
| 50 | err = -EINVAL; |
| 51 | for (i = 0; i < mdsc->mdsmap->m_num_data_pg_pools; i++) |
| 52 | if (mdsc->mdsmap->m_data_pg_pools[i] == l->data_pool) { |
| 53 | err = 0; |
| 54 | break; |
| 55 | } |
| 56 | mutex_unlock(&mdsc->mutex); |
| 57 | if (err) |
| 58 | return err; |
| 59 | |
| 60 | return 0; |
| 61 | } |
| 62 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 63 | static long ceph_ioctl_set_layout(struct file *file, void __user *arg) |
| 64 | { |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 65 | struct inode *inode = file_inode(file); |
Yehuda Sadeh | 3d14c5d | 2010-04-06 15:14:15 -0700 | [diff] [blame] | 66 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 67 | struct ceph_mds_request *req; |
| 68 | struct ceph_ioctl_layout l; |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 69 | struct ceph_inode_info *ci = ceph_inode(file_inode(file)); |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 70 | struct ceph_ioctl_layout nl; |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 71 | int err; |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 72 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 73 | if (copy_from_user(&l, arg, sizeof(l))) |
| 74 | return -EFAULT; |
| 75 | |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 76 | /* validate changed params against current layout */ |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 77 | err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT); |
Sage Weil | 702aeb1 | 2012-05-14 12:34:38 -0700 | [diff] [blame] | 78 | if (err) |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 79 | return err; |
| 80 | |
Sage Weil | 702aeb1 | 2012-05-14 12:34:38 -0700 | [diff] [blame] | 81 | memset(&nl, 0, sizeof(nl)); |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 82 | if (l.stripe_count) |
| 83 | nl.stripe_count = l.stripe_count; |
Sage Weil | 702aeb1 | 2012-05-14 12:34:38 -0700 | [diff] [blame] | 84 | else |
| 85 | nl.stripe_count = ceph_file_layout_stripe_count(ci->i_layout); |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 86 | if (l.stripe_unit) |
| 87 | nl.stripe_unit = l.stripe_unit; |
Sage Weil | 702aeb1 | 2012-05-14 12:34:38 -0700 | [diff] [blame] | 88 | else |
| 89 | nl.stripe_unit = ceph_file_layout_su(ci->i_layout); |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 90 | if (l.object_size) |
| 91 | nl.object_size = l.object_size; |
Sage Weil | 702aeb1 | 2012-05-14 12:34:38 -0700 | [diff] [blame] | 92 | else |
| 93 | nl.object_size = ceph_file_layout_object_size(ci->i_layout); |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 94 | if (l.data_pool) |
| 95 | nl.data_pool = l.data_pool; |
Sage Weil | 702aeb1 | 2012-05-14 12:34:38 -0700 | [diff] [blame] | 96 | else |
| 97 | nl.data_pool = ceph_file_layout_pg_pool(ci->i_layout); |
| 98 | |
| 99 | /* this is obsolete, and always -1 */ |
| 100 | nl.preferred_osd = le64_to_cpu(-1); |
Greg Farnum | a35eca9 | 2011-08-25 12:43:06 -0700 | [diff] [blame] | 101 | |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 102 | err = __validate_layout(mdsc, &nl); |
| 103 | if (err) |
| 104 | return err; |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 105 | |
| 106 | req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETLAYOUT, |
| 107 | USE_AUTH_MDS); |
| 108 | if (IS_ERR(req)) |
| 109 | return PTR_ERR(req); |
Sage Weil | 70b666c | 2011-05-27 09:24:26 -0700 | [diff] [blame] | 110 | req->r_inode = inode; |
| 111 | ihold(inode); |
Yan, Zheng | 3bd5814 | 2014-04-27 09:17:45 +0800 | [diff] [blame] | 112 | req->r_num_caps = 1; |
| 113 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 114 | req->r_inode_drop = CEPH_CAP_FILE_SHARED | CEPH_CAP_FILE_EXCL; |
| 115 | |
| 116 | req->r_args.setlayout.layout.fl_stripe_unit = |
| 117 | cpu_to_le32(l.stripe_unit); |
| 118 | req->r_args.setlayout.layout.fl_stripe_count = |
| 119 | cpu_to_le32(l.stripe_count); |
| 120 | req->r_args.setlayout.layout.fl_object_size = |
| 121 | cpu_to_le32(l.object_size); |
| 122 | req->r_args.setlayout.layout.fl_pg_pool = cpu_to_le32(l.data_pool); |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 123 | |
Sage Weil | 752c8bd | 2013-02-05 13:52:29 -0800 | [diff] [blame] | 124 | err = ceph_mdsc_do_request(mdsc, NULL, req); |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 125 | ceph_mdsc_put_request(req); |
| 126 | return err; |
| 127 | } |
| 128 | |
| 129 | /* |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 130 | * Set a layout policy on a directory inode. All items in the tree |
| 131 | * rooted at this inode will inherit this layout on creation, |
| 132 | * (It doesn't apply retroactively ) |
| 133 | * unless a subdirectory has its own layout policy. |
| 134 | */ |
| 135 | static long ceph_ioctl_set_layout_policy (struct file *file, void __user *arg) |
| 136 | { |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 137 | struct inode *inode = file_inode(file); |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 138 | struct ceph_mds_request *req; |
| 139 | struct ceph_ioctl_layout l; |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 140 | int err; |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 141 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
| 142 | |
| 143 | /* copy and validate */ |
| 144 | if (copy_from_user(&l, arg, sizeof(l))) |
| 145 | return -EFAULT; |
| 146 | |
Sage Weil | e49bf4c | 2012-05-07 15:34:35 -0700 | [diff] [blame] | 147 | err = __validate_layout(mdsc, &l); |
| 148 | if (err) |
| 149 | return err; |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 150 | |
| 151 | req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETDIRLAYOUT, |
| 152 | USE_AUTH_MDS); |
| 153 | |
| 154 | if (IS_ERR(req)) |
| 155 | return PTR_ERR(req); |
Sage Weil | 70b666c | 2011-05-27 09:24:26 -0700 | [diff] [blame] | 156 | req->r_inode = inode; |
| 157 | ihold(inode); |
Yan, Zheng | 3bd5814 | 2014-04-27 09:17:45 +0800 | [diff] [blame] | 158 | req->r_num_caps = 1; |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 159 | |
| 160 | req->r_args.setlayout.layout.fl_stripe_unit = |
| 161 | cpu_to_le32(l.stripe_unit); |
| 162 | req->r_args.setlayout.layout.fl_stripe_count = |
| 163 | cpu_to_le32(l.stripe_count); |
| 164 | req->r_args.setlayout.layout.fl_object_size = |
| 165 | cpu_to_le32(l.object_size); |
| 166 | req->r_args.setlayout.layout.fl_pg_pool = |
| 167 | cpu_to_le32(l.data_pool); |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 168 | |
| 169 | err = ceph_mdsc_do_request(mdsc, inode, req); |
| 170 | ceph_mdsc_put_request(req); |
| 171 | return err; |
| 172 | } |
| 173 | |
| 174 | /* |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 175 | * Return object name, size/offset information, and location (OSD |
| 176 | * number, network address) for a given file offset. |
| 177 | */ |
| 178 | static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg) |
| 179 | { |
| 180 | struct ceph_ioctl_dataloc dl; |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 181 | struct inode *inode = file_inode(file); |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 182 | struct ceph_inode_info *ci = ceph_inode(inode); |
Yehuda Sadeh | 3d14c5d | 2010-04-06 15:14:15 -0700 | [diff] [blame] | 183 | struct ceph_osd_client *osdc = |
| 184 | &ceph_sb_to_client(inode->i_sb)->client->osdc; |
Ilya Dryomov | 7c13cb6 | 2014-01-27 17:40:19 +0200 | [diff] [blame] | 185 | struct ceph_object_locator oloc; |
| 186 | struct ceph_object_id oid; |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 187 | u64 len = 1, olen; |
| 188 | u64 tmp; |
Sage Weil | 5104212 | 2009-11-04 11:39:12 -0800 | [diff] [blame] | 189 | struct ceph_pg pgid; |
Sage Weil | 457712a | 2012-09-24 21:04:57 -0700 | [diff] [blame] | 190 | int r; |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 191 | |
| 192 | /* copy and validate */ |
| 193 | if (copy_from_user(&dl, arg, sizeof(dl))) |
| 194 | return -EFAULT; |
| 195 | |
| 196 | down_read(&osdc->map_sem); |
Alex Elder | e8afad6 | 2012-11-14 09:38:19 -0600 | [diff] [blame] | 197 | r = ceph_calc_file_object_mapping(&ci->i_layout, dl.file_offset, len, |
Sage Weil | 457712a | 2012-09-24 21:04:57 -0700 | [diff] [blame] | 198 | &dl.object_no, &dl.object_offset, |
| 199 | &olen); |
majianpeng | 494ddd1 | 2013-07-16 19:36:21 +0800 | [diff] [blame] | 200 | if (r < 0) { |
| 201 | up_read(&osdc->map_sem); |
Sage Weil | 457712a | 2012-09-24 21:04:57 -0700 | [diff] [blame] | 202 | return -EIO; |
majianpeng | 494ddd1 | 2013-07-16 19:36:21 +0800 | [diff] [blame] | 203 | } |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 204 | dl.file_offset -= dl.object_offset; |
| 205 | dl.object_size = ceph_file_layout_object_size(ci->i_layout); |
| 206 | dl.block_size = ceph_file_layout_su(ci->i_layout); |
| 207 | |
| 208 | /* block_offset = object_offset % block_size */ |
| 209 | tmp = dl.object_offset; |
| 210 | dl.block_offset = do_div(tmp, dl.block_size); |
| 211 | |
| 212 | snprintf(dl.object_name, sizeof(dl.object_name), "%llx.%08llx", |
| 213 | ceph_ino(inode), dl.object_no); |
Alex Elder | 41766f8 | 2013-03-01 18:00:15 -0600 | [diff] [blame] | 214 | |
Ilya Dryomov | 7c13cb6 | 2014-01-27 17:40:19 +0200 | [diff] [blame] | 215 | oloc.pool = ceph_file_layout_pg_pool(ci->i_layout); |
| 216 | ceph_oid_set_name(&oid, dl.object_name); |
| 217 | |
| 218 | r = ceph_oloc_oid_to_pg(osdc->osdmap, &oloc, &oid, &pgid); |
majianpeng | 2fbcbff | 2013-08-02 18:14:48 +0800 | [diff] [blame] | 219 | if (r < 0) { |
| 220 | up_read(&osdc->map_sem); |
| 221 | return r; |
| 222 | } |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 223 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 224 | dl.osd = ceph_calc_pg_primary(osdc->osdmap, pgid); |
| 225 | if (dl.osd >= 0) { |
| 226 | struct ceph_entity_addr *a = |
| 227 | ceph_osd_addr(osdc->osdmap, dl.osd); |
| 228 | if (a) |
| 229 | memcpy(&dl.osd_addr, &a->in_addr, sizeof(dl.osd_addr)); |
| 230 | } else { |
| 231 | memset(&dl.osd_addr, 0, sizeof(dl.osd_addr)); |
| 232 | } |
| 233 | up_read(&osdc->map_sem); |
| 234 | |
| 235 | /* send result back to user */ |
| 236 | if (copy_to_user(arg, &dl, sizeof(dl))) |
| 237 | return -EFAULT; |
| 238 | |
| 239 | return 0; |
| 240 | } |
| 241 | |
Sage Weil | 8c6e922 | 2010-04-16 09:53:43 -0700 | [diff] [blame] | 242 | static long ceph_ioctl_lazyio(struct file *file) |
| 243 | { |
| 244 | struct ceph_file_info *fi = file->private_data; |
Al Viro | 496ad9a | 2013-01-23 17:07:38 -0500 | [diff] [blame] | 245 | struct inode *inode = file_inode(file); |
Sage Weil | 8c6e922 | 2010-04-16 09:53:43 -0700 | [diff] [blame] | 246 | struct ceph_inode_info *ci = ceph_inode(inode); |
| 247 | |
| 248 | if ((fi->fmode & CEPH_FILE_MODE_LAZY) == 0) { |
Sage Weil | be65559 | 2011-11-30 09:47:09 -0800 | [diff] [blame] | 249 | spin_lock(&ci->i_ceph_lock); |
Sage Weil | 8c6e922 | 2010-04-16 09:53:43 -0700 | [diff] [blame] | 250 | ci->i_nr_by_mode[fi->fmode]--; |
| 251 | fi->fmode |= CEPH_FILE_MODE_LAZY; |
| 252 | ci->i_nr_by_mode[fi->fmode]++; |
Sage Weil | be65559 | 2011-11-30 09:47:09 -0800 | [diff] [blame] | 253 | spin_unlock(&ci->i_ceph_lock); |
Sage Weil | 8c6e922 | 2010-04-16 09:53:43 -0700 | [diff] [blame] | 254 | dout("ioctl_layzio: file %p marked lazy\n", file); |
| 255 | |
| 256 | ceph_check_caps(ci, 0, NULL); |
| 257 | } else { |
| 258 | dout("ioctl_layzio: file %p already lazy\n", file); |
| 259 | } |
| 260 | return 0; |
| 261 | } |
| 262 | |
Sage Weil | 4918b6d | 2011-07-26 11:26:07 -0700 | [diff] [blame] | 263 | static long ceph_ioctl_syncio(struct file *file) |
| 264 | { |
| 265 | struct ceph_file_info *fi = file->private_data; |
| 266 | |
| 267 | fi->flags |= CEPH_F_SYNC; |
| 268 | return 0; |
| 269 | } |
| 270 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 271 | long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg) |
| 272 | { |
| 273 | dout("ioctl file %p cmd %u arg %lu\n", file, cmd, arg); |
| 274 | switch (cmd) { |
| 275 | case CEPH_IOC_GET_LAYOUT: |
| 276 | return ceph_ioctl_get_layout(file, (void __user *)arg); |
| 277 | |
| 278 | case CEPH_IOC_SET_LAYOUT: |
| 279 | return ceph_ioctl_set_layout(file, (void __user *)arg); |
| 280 | |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 281 | case CEPH_IOC_SET_LAYOUT_POLICY: |
| 282 | return ceph_ioctl_set_layout_policy(file, (void __user *)arg); |
| 283 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 284 | case CEPH_IOC_GET_DATALOC: |
| 285 | return ceph_ioctl_get_dataloc(file, (void __user *)arg); |
Sage Weil | 8c6e922 | 2010-04-16 09:53:43 -0700 | [diff] [blame] | 286 | |
| 287 | case CEPH_IOC_LAZYIO: |
| 288 | return ceph_ioctl_lazyio(file); |
Sage Weil | 4918b6d | 2011-07-26 11:26:07 -0700 | [diff] [blame] | 289 | |
| 290 | case CEPH_IOC_SYNCIO: |
| 291 | return ceph_ioctl_syncio(file); |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 292 | } |
Greg Farnum | 571dba5 | 2010-09-24 14:56:40 -0700 | [diff] [blame] | 293 | |
Sage Weil | 8f4e91d | 2009-10-06 11:31:14 -0700 | [diff] [blame] | 294 | return -ENOTTY; |
| 295 | } |