| /* |
| * (C) 2001 Clemson University and The University of Chicago |
| * |
| * See COPYING in top-level directory. |
| */ |
| #include "protocol.h" |
| #include "orangefs-kernel.h" |
| #include "orangefs-dev-proto.h" |
| #include "orangefs-bufmap.h" |
| |
| __s32 fsid_of_op(struct orangefs_kernel_op_s *op) |
| { |
| __s32 fsid = ORANGEFS_FS_ID_NULL; |
| |
| if (op) { |
| switch (op->upcall.type) { |
| case ORANGEFS_VFS_OP_FILE_IO: |
| fsid = op->upcall.req.io.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_LOOKUP: |
| fsid = op->upcall.req.lookup.parent_refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_CREATE: |
| fsid = op->upcall.req.create.parent_refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_GETATTR: |
| fsid = op->upcall.req.getattr.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_REMOVE: |
| fsid = op->upcall.req.remove.parent_refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_MKDIR: |
| fsid = op->upcall.req.mkdir.parent_refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_READDIR: |
| fsid = op->upcall.req.readdir.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_SETATTR: |
| fsid = op->upcall.req.setattr.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_SYMLINK: |
| fsid = op->upcall.req.sym.parent_refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_RENAME: |
| fsid = op->upcall.req.rename.old_parent_refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_STATFS: |
| fsid = op->upcall.req.statfs.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_TRUNCATE: |
| fsid = op->upcall.req.truncate.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_MMAP_RA_FLUSH: |
| fsid = op->upcall.req.ra_cache_flush.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_FS_UMOUNT: |
| fsid = op->upcall.req.fs_umount.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_GETXATTR: |
| fsid = op->upcall.req.getxattr.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_SETXATTR: |
| fsid = op->upcall.req.setxattr.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_LISTXATTR: |
| fsid = op->upcall.req.listxattr.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_REMOVEXATTR: |
| fsid = op->upcall.req.removexattr.refn.fs_id; |
| break; |
| case ORANGEFS_VFS_OP_FSYNC: |
| fsid = op->upcall.req.fsync.refn.fs_id; |
| break; |
| default: |
| break; |
| } |
| } |
| return fsid; |
| } |
| |
| static int orangefs_inode_flags(struct ORANGEFS_sys_attr_s *attrs) |
| { |
| int flags = 0; |
| if (attrs->flags & ORANGEFS_IMMUTABLE_FL) |
| flags |= S_IMMUTABLE; |
| else |
| flags &= ~S_IMMUTABLE; |
| if (attrs->flags & ORANGEFS_APPEND_FL) |
| flags |= S_APPEND; |
| else |
| flags &= ~S_APPEND; |
| if (attrs->flags & ORANGEFS_NOATIME_FL) |
| flags |= S_NOATIME; |
| else |
| flags &= ~S_NOATIME; |
| return flags; |
| } |
| |
| static int orangefs_inode_perms(struct ORANGEFS_sys_attr_s *attrs) |
| { |
| int perm_mode = 0; |
| |
| if (attrs->perms & ORANGEFS_O_EXECUTE) |
| perm_mode |= S_IXOTH; |
| if (attrs->perms & ORANGEFS_O_WRITE) |
| perm_mode |= S_IWOTH; |
| if (attrs->perms & ORANGEFS_O_READ) |
| perm_mode |= S_IROTH; |
| |
| if (attrs->perms & ORANGEFS_G_EXECUTE) |
| perm_mode |= S_IXGRP; |
| if (attrs->perms & ORANGEFS_G_WRITE) |
| perm_mode |= S_IWGRP; |
| if (attrs->perms & ORANGEFS_G_READ) |
| perm_mode |= S_IRGRP; |
| |
| if (attrs->perms & ORANGEFS_U_EXECUTE) |
| perm_mode |= S_IXUSR; |
| if (attrs->perms & ORANGEFS_U_WRITE) |
| perm_mode |= S_IWUSR; |
| if (attrs->perms & ORANGEFS_U_READ) |
| perm_mode |= S_IRUSR; |
| |
| if (attrs->perms & ORANGEFS_G_SGID) |
| perm_mode |= S_ISGID; |
| if (attrs->perms & ORANGEFS_U_SUID) |
| perm_mode |= S_ISUID; |
| |
| return perm_mode; |
| } |
| |
| /* NOTE: symname is ignored unless the inode is a sym link */ |
| static int copy_attributes_to_inode(struct inode *inode, |
| struct ORANGEFS_sys_attr_s *attrs, |
| char *symname) |
| { |
| int ret = -1; |
| struct orangefs_inode_s *orangefs_inode = ORANGEFS_I(inode); |
| loff_t inode_size = 0; |
| loff_t rounded_up_size = 0; |
| |
| |
| /* |
| * arbitrarily set the inode block size; FIXME: we need to |
| * resolve the difference between the reported inode blocksize |
| * and the PAGE_CACHE_SIZE, since our block count will always |
| * be wrong. |
| * |
| * For now, we're setting the block count to be the proper |
| * number assuming the block size is 512 bytes, and the size is |
| * rounded up to the nearest 4K. This is apparently required |
| * to get proper size reports from the 'du' shell utility. |
| * |
| * changing the inode->i_blkbits to something other than |
| * PAGE_CACHE_SHIFT breaks mmap/execution as we depend on that. |
| */ |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "attrs->mask = %x (objtype = %s)\n", |
| attrs->mask, |
| attrs->objtype == ORANGEFS_TYPE_METAFILE ? "file" : |
| attrs->objtype == ORANGEFS_TYPE_DIRECTORY ? "directory" : |
| attrs->objtype == ORANGEFS_TYPE_SYMLINK ? "symlink" : |
| "invalid/unknown"); |
| |
| switch (attrs->objtype) { |
| case ORANGEFS_TYPE_METAFILE: |
| inode->i_flags = orangefs_inode_flags(attrs); |
| if (attrs->mask & ORANGEFS_ATTR_SYS_SIZE) { |
| inode_size = (loff_t) attrs->size; |
| rounded_up_size = |
| (inode_size + (4096 - (inode_size % 4096))); |
| |
| spin_lock(&inode->i_lock); |
| inode->i_bytes = inode_size; |
| inode->i_blocks = |
| (unsigned long)(rounded_up_size / 512); |
| spin_unlock(&inode->i_lock); |
| |
| /* |
| * NOTE: make sure all the places we're called |
| * from have the inode->i_sem lock. We're fine |
| * in 99% of the cases since we're mostly |
| * called from a lookup. |
| */ |
| inode->i_size = inode_size; |
| } |
| break; |
| case ORANGEFS_TYPE_SYMLINK: |
| if (symname != NULL) { |
| inode->i_size = (loff_t) strlen(symname); |
| break; |
| } |
| /*FALLTHRU*/ |
| default: |
| inode->i_size = PAGE_CACHE_SIZE; |
| |
| spin_lock(&inode->i_lock); |
| inode_set_bytes(inode, inode->i_size); |
| spin_unlock(&inode->i_lock); |
| break; |
| } |
| |
| inode->i_uid = make_kuid(&init_user_ns, attrs->owner); |
| inode->i_gid = make_kgid(&init_user_ns, attrs->group); |
| inode->i_atime.tv_sec = (time64_t) attrs->atime; |
| inode->i_mtime.tv_sec = (time64_t) attrs->mtime; |
| inode->i_ctime.tv_sec = (time64_t) attrs->ctime; |
| inode->i_atime.tv_nsec = 0; |
| inode->i_mtime.tv_nsec = 0; |
| inode->i_ctime.tv_nsec = 0; |
| |
| inode->i_mode = orangefs_inode_perms(attrs); |
| |
| if (is_root_handle(inode)) { |
| /* special case: mark the root inode as sticky */ |
| inode->i_mode |= S_ISVTX; |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "Marking inode %pU as sticky\n", |
| get_khandle_from_ino(inode)); |
| } |
| |
| switch (attrs->objtype) { |
| case ORANGEFS_TYPE_METAFILE: |
| inode->i_mode |= S_IFREG; |
| ret = 0; |
| break; |
| case ORANGEFS_TYPE_DIRECTORY: |
| inode->i_mode |= S_IFDIR; |
| /* NOTE: we have no good way to keep nlink consistent |
| * for directories across clients; keep constant at 1. |
| * Why 1? If we go with 2, then find(1) gets confused |
| * and won't work properly withouth the -noleaf option |
| */ |
| set_nlink(inode, 1); |
| ret = 0; |
| break; |
| case ORANGEFS_TYPE_SYMLINK: |
| inode->i_mode |= S_IFLNK; |
| |
| /* copy link target to inode private data */ |
| if (orangefs_inode && symname) { |
| strncpy(orangefs_inode->link_target, |
| symname, |
| ORANGEFS_NAME_MAX); |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "Copied attr link target %s\n", |
| orangefs_inode->link_target); |
| } |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "symlink mode %o\n", |
| inode->i_mode); |
| ret = 0; |
| break; |
| default: |
| gossip_err("orangefs: copy_attributes_to_inode: got invalid attribute type %x\n", |
| attrs->objtype); |
| } |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "orangefs: copy_attributes_to_inode: setting i_mode to %o, i_size to %lu\n", |
| inode->i_mode, |
| (unsigned long)i_size_read(inode)); |
| |
| return ret; |
| } |
| |
| /* |
| * NOTE: in kernel land, we never use the sys_attr->link_target for |
| * anything, so don't bother copying it into the sys_attr object here. |
| */ |
| static inline int copy_attributes_from_inode(struct inode *inode, |
| struct ORANGEFS_sys_attr_s *attrs, |
| struct iattr *iattr) |
| { |
| umode_t tmp_mode; |
| |
| if (!iattr || !inode || !attrs) { |
| gossip_err("NULL iattr (%p), inode (%p), attrs (%p) " |
| "in copy_attributes_from_inode!\n", |
| iattr, |
| inode, |
| attrs); |
| return -EINVAL; |
| } |
| /* |
| * We need to be careful to only copy the attributes out of the |
| * iattr object that we know are valid. |
| */ |
| attrs->mask = 0; |
| if (iattr->ia_valid & ATTR_UID) { |
| attrs->owner = from_kuid(current_user_ns(), iattr->ia_uid); |
| attrs->mask |= ORANGEFS_ATTR_SYS_UID; |
| gossip_debug(GOSSIP_UTILS_DEBUG, "(UID) %d\n", attrs->owner); |
| } |
| if (iattr->ia_valid & ATTR_GID) { |
| attrs->group = from_kgid(current_user_ns(), iattr->ia_gid); |
| attrs->mask |= ORANGEFS_ATTR_SYS_GID; |
| gossip_debug(GOSSIP_UTILS_DEBUG, "(GID) %d\n", attrs->group); |
| } |
| |
| if (iattr->ia_valid & ATTR_ATIME) { |
| attrs->mask |= ORANGEFS_ATTR_SYS_ATIME; |
| if (iattr->ia_valid & ATTR_ATIME_SET) { |
| attrs->atime = (time64_t)iattr->ia_atime.tv_sec; |
| attrs->mask |= ORANGEFS_ATTR_SYS_ATIME_SET; |
| } |
| } |
| if (iattr->ia_valid & ATTR_MTIME) { |
| attrs->mask |= ORANGEFS_ATTR_SYS_MTIME; |
| if (iattr->ia_valid & ATTR_MTIME_SET) { |
| attrs->mtime = (time64_t)iattr->ia_mtime.tv_sec; |
| attrs->mask |= ORANGEFS_ATTR_SYS_MTIME_SET; |
| } |
| } |
| if (iattr->ia_valid & ATTR_CTIME) |
| attrs->mask |= ORANGEFS_ATTR_SYS_CTIME; |
| |
| /* |
| * ORANGEFS cannot set size with a setattr operation. Probably not likely |
| * to be requested through the VFS, but just in case, don't worry about |
| * ATTR_SIZE |
| */ |
| |
| if (iattr->ia_valid & ATTR_MODE) { |
| tmp_mode = iattr->ia_mode; |
| if (tmp_mode & (S_ISVTX)) { |
| if (is_root_handle(inode)) { |
| /* |
| * allow sticky bit to be set on root (since |
| * it shows up that way by default anyhow), |
| * but don't show it to the server |
| */ |
| tmp_mode -= S_ISVTX; |
| } else { |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "User attempted to set sticky bit on non-root directory; returning EINVAL.\n"); |
| return -EINVAL; |
| } |
| } |
| |
| if (tmp_mode & (S_ISUID)) { |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "Attempting to set setuid bit (not supported); returning EINVAL.\n"); |
| return -EINVAL; |
| } |
| |
| attrs->perms = ORANGEFS_util_translate_mode(tmp_mode); |
| attrs->mask |= ORANGEFS_ATTR_SYS_PERM; |
| } |
| |
| return 0; |
| } |
| |
| static int compare_attributes_to_inode(struct inode *inode, |
| struct ORANGEFS_sys_attr_s *attrs, |
| char *symname, |
| int mask) |
| { |
| struct orangefs_inode_s *orangefs_inode = ORANGEFS_I(inode); |
| loff_t inode_size, rounded_up_size; |
| |
| /* Much of what happens below relies on the type being around. */ |
| if (!(mask & ORANGEFS_ATTR_SYS_TYPE)) |
| return 0; |
| |
| if (attrs->objtype == ORANGEFS_TYPE_METAFILE && |
| inode->i_flags != orangefs_inode_flags(attrs)) |
| return 0; |
| |
| /* Compare file size. */ |
| |
| switch (attrs->objtype) { |
| case ORANGEFS_TYPE_METAFILE: |
| if (mask & ORANGEFS_ATTR_SYS_SIZE) { |
| inode_size = attrs->size; |
| rounded_up_size = inode_size + |
| (4096 - (inode_size % 4096)); |
| if (inode->i_bytes != inode_size || |
| inode->i_blocks != rounded_up_size/512) |
| return 0; |
| } |
| break; |
| case ORANGEFS_TYPE_SYMLINK: |
| if (mask & ORANGEFS_ATTR_SYS_SIZE) |
| if (symname && strlen(symname) != inode->i_size) |
| return 0; |
| break; |
| default: |
| if (inode->i_size != PAGE_CACHE_SIZE && |
| inode_get_bytes(inode) != PAGE_CACHE_SIZE) |
| return 0; |
| } |
| |
| /* Compare general attributes. */ |
| |
| if (mask & ORANGEFS_ATTR_SYS_UID && |
| !uid_eq(inode->i_uid, make_kuid(&init_user_ns, attrs->owner))) |
| return 0; |
| if (mask & ORANGEFS_ATTR_SYS_GID && |
| !gid_eq(inode->i_gid, make_kgid(&init_user_ns, attrs->group))) |
| return 0; |
| if (mask & ORANGEFS_ATTR_SYS_ATIME && |
| inode->i_atime.tv_sec != attrs->atime) |
| return 0; |
| if (mask & ORANGEFS_ATTR_SYS_MTIME && |
| inode->i_atime.tv_sec != attrs->mtime) |
| return 0; |
| if (mask & ORANGEFS_ATTR_SYS_CTIME && |
| inode->i_atime.tv_sec != attrs->ctime) |
| return 0; |
| if (inode->i_atime.tv_nsec != 0 || |
| inode->i_mtime.tv_nsec != 0 || |
| inode->i_ctime.tv_nsec != 0) |
| return 0; |
| |
| if (mask & ORANGEFS_ATTR_SYS_PERM && |
| (inode->i_mode & ~(S_ISVTX|S_IFREG|S_IFDIR|S_IFLNK)) != |
| orangefs_inode_perms(attrs)) |
| return 0; |
| |
| if (is_root_handle(inode)) |
| if (!(inode->i_mode & S_ISVTX)) |
| return 0; |
| |
| /* Compare file type. */ |
| |
| switch (attrs->objtype) { |
| case ORANGEFS_TYPE_METAFILE: |
| if (!S_ISREG(inode->i_mode)) |
| return 0; |
| break; |
| case ORANGEFS_TYPE_DIRECTORY: |
| if (!S_ISDIR(inode->i_mode)) |
| return 0; |
| if (inode->i_nlink != 1) |
| return 0; |
| break; |
| case ORANGEFS_TYPE_SYMLINK: |
| if (!S_ISLNK(inode->i_mode)) |
| return 0; |
| if (orangefs_inode && symname && |
| mask & ORANGEFS_ATTR_SYS_LNK_TARGET) |
| if (strcmp(orangefs_inode->link_target, symname)) |
| return 0; |
| break; |
| default: |
| gossip_err("orangefs: compare_attributes_to_inode: got invalid attribute type %x\n", |
| attrs->objtype); |
| |
| } |
| |
| return 1; |
| } |
| |
| /* |
| * Issues a orangefs getattr request and fills in the appropriate inode |
| * attributes if successful. When check is 0, returns 0 on success and -errno |
| * otherwise. When check is 1, returns 1 on success where the inode is valid |
| * and 0 on success where the inode is stale and -errno otherwise. |
| */ |
| int orangefs_inode_getattr(struct inode *inode, __u32 getattr_mask, int check) |
| { |
| struct orangefs_inode_s *orangefs_inode = ORANGEFS_I(inode); |
| struct orangefs_kernel_op_s *new_op; |
| int ret = -EINVAL; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "%s: called on inode %pU\n", |
| __func__, |
| get_khandle_from_ino(inode)); |
| |
| new_op = op_alloc(ORANGEFS_VFS_OP_GETATTR); |
| if (!new_op) |
| return -ENOMEM; |
| new_op->upcall.req.getattr.refn = orangefs_inode->refn; |
| new_op->upcall.req.getattr.mask = getattr_mask; |
| |
| ret = service_operation(new_op, __func__, |
| get_interruptible_flag(inode)); |
| if (ret != 0) |
| goto out; |
| |
| if (check) { |
| ret = compare_attributes_to_inode(inode, |
| &new_op->downcall.resp.getattr.attributes, |
| new_op->downcall.resp.getattr.link_target, |
| getattr_mask); |
| |
| if (new_op->downcall.resp.getattr.attributes.objtype == |
| ORANGEFS_TYPE_METAFILE) { |
| if (orangefs_inode->blksize != |
| new_op->downcall.resp.getattr.attributes.blksize) |
| ret = 0; |
| } else { |
| if (orangefs_inode->blksize != 1 << inode->i_blkbits) |
| ret = 0; |
| } |
| } else { |
| if (copy_attributes_to_inode(inode, |
| &new_op->downcall.resp.getattr.attributes, |
| new_op->downcall.resp.getattr.link_target)) { |
| gossip_err("%s: failed to copy attributes\n", __func__); |
| ret = -ENOENT; |
| goto out; |
| } |
| |
| /* |
| * Store blksize in orangefs specific part of inode structure; |
| * we are only going to use this to report to stat to make sure |
| * it doesn't perturb any inode related code paths. |
| */ |
| if (new_op->downcall.resp.getattr.attributes.objtype == |
| ORANGEFS_TYPE_METAFILE) { |
| orangefs_inode->blksize = new_op->downcall.resp. |
| getattr.attributes.blksize; |
| } else { |
| /* |
| * mimic behavior of generic_fillattr() for other file |
| * types. |
| */ |
| orangefs_inode->blksize = (1 << inode->i_blkbits); |
| |
| } |
| } |
| |
| out: |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "Getattr on handle %pU, " |
| "fsid %d\n (inode ct = %d) returned %d\n", |
| &orangefs_inode->refn.khandle, |
| orangefs_inode->refn.fs_id, |
| (int)atomic_read(&inode->i_count), |
| ret); |
| |
| op_release(new_op); |
| return ret; |
| } |
| |
| /* |
| * issues a orangefs setattr request to make sure the new attribute values |
| * take effect if successful. returns 0 on success; -errno otherwise |
| */ |
| int orangefs_inode_setattr(struct inode *inode, struct iattr *iattr) |
| { |
| struct orangefs_inode_s *orangefs_inode = ORANGEFS_I(inode); |
| struct orangefs_kernel_op_s *new_op; |
| int ret; |
| |
| new_op = op_alloc(ORANGEFS_VFS_OP_SETATTR); |
| if (!new_op) |
| return -ENOMEM; |
| |
| new_op->upcall.req.setattr.refn = orangefs_inode->refn; |
| ret = copy_attributes_from_inode(inode, |
| &new_op->upcall.req.setattr.attributes, |
| iattr); |
| if (ret >= 0) { |
| ret = service_operation(new_op, __func__, |
| get_interruptible_flag(inode)); |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "orangefs_inode_setattr: returning %d\n", |
| ret); |
| } |
| |
| op_release(new_op); |
| |
| /* |
| * successful setattr should clear the atime, mtime and |
| * ctime flags. |
| */ |
| if (ret == 0) { |
| ClearAtimeFlag(orangefs_inode); |
| ClearMtimeFlag(orangefs_inode); |
| ClearCtimeFlag(orangefs_inode); |
| ClearModeFlag(orangefs_inode); |
| } |
| |
| return ret; |
| } |
| |
| int orangefs_flush_inode(struct inode *inode) |
| { |
| /* |
| * If it is a dirty inode, this function gets called. |
| * Gather all the information that needs to be setattr'ed |
| * Right now, this will only be used for mode, atime, mtime |
| * and/or ctime. |
| */ |
| struct iattr wbattr; |
| int ret; |
| int mtime_flag; |
| int ctime_flag; |
| int atime_flag; |
| int mode_flag; |
| struct orangefs_inode_s *orangefs_inode = ORANGEFS_I(inode); |
| |
| memset(&wbattr, 0, sizeof(wbattr)); |
| |
| /* |
| * check inode flags up front, and clear them if they are set. This |
| * will prevent multiple processes from all trying to flush the same |
| * inode if they call close() simultaneously |
| */ |
| mtime_flag = MtimeFlag(orangefs_inode); |
| ClearMtimeFlag(orangefs_inode); |
| ctime_flag = CtimeFlag(orangefs_inode); |
| ClearCtimeFlag(orangefs_inode); |
| atime_flag = AtimeFlag(orangefs_inode); |
| ClearAtimeFlag(orangefs_inode); |
| mode_flag = ModeFlag(orangefs_inode); |
| ClearModeFlag(orangefs_inode); |
| |
| /* -- Lazy atime,mtime and ctime update -- |
| * Note: all times are dictated by server in the new scheme |
| * and not by the clients |
| * |
| * Also mode updates are being handled now.. |
| */ |
| |
| if (mtime_flag) |
| wbattr.ia_valid |= ATTR_MTIME; |
| if (ctime_flag) |
| wbattr.ia_valid |= ATTR_CTIME; |
| if (atime_flag) |
| wbattr.ia_valid |= ATTR_ATIME; |
| |
| if (mode_flag) { |
| wbattr.ia_mode = inode->i_mode; |
| wbattr.ia_valid |= ATTR_MODE; |
| } |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "*********** orangefs_flush_inode: %pU " |
| "(ia_valid %d)\n", |
| get_khandle_from_ino(inode), |
| wbattr.ia_valid); |
| if (wbattr.ia_valid == 0) { |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "orangefs_flush_inode skipping setattr()\n"); |
| return 0; |
| } |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "orangefs_flush_inode (%pU) writing mode %o\n", |
| get_khandle_from_ino(inode), |
| inode->i_mode); |
| |
| ret = orangefs_inode_setattr(inode, &wbattr); |
| |
| return ret; |
| } |
| |
| int orangefs_unmount_sb(struct super_block *sb) |
| { |
| int ret = -EINVAL; |
| struct orangefs_kernel_op_s *new_op = NULL; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "orangefs_unmount_sb called on sb %p\n", |
| sb); |
| |
| new_op = op_alloc(ORANGEFS_VFS_OP_FS_UMOUNT); |
| if (!new_op) |
| return -ENOMEM; |
| new_op->upcall.req.fs_umount.id = ORANGEFS_SB(sb)->id; |
| new_op->upcall.req.fs_umount.fs_id = ORANGEFS_SB(sb)->fs_id; |
| strncpy(new_op->upcall.req.fs_umount.orangefs_config_server, |
| ORANGEFS_SB(sb)->devname, |
| ORANGEFS_MAX_SERVER_ADDR_LEN); |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "Attempting ORANGEFS Unmount via host %s\n", |
| new_op->upcall.req.fs_umount.orangefs_config_server); |
| |
| ret = service_operation(new_op, "orangefs_fs_umount", 0); |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "orangefs_unmount: got return value of %d\n", ret); |
| if (ret) |
| sb = ERR_PTR(ret); |
| else |
| ORANGEFS_SB(sb)->mount_pending = 1; |
| |
| op_release(new_op); |
| return ret; |
| } |
| |
| void orangefs_make_bad_inode(struct inode *inode) |
| { |
| if (is_root_handle(inode)) { |
| /* |
| * if this occurs, the pvfs2-client-core was killed but we |
| * can't afford to lose the inode operations and such |
| * associated with the root handle in any case. |
| */ |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "*** NOT making bad root inode %pU\n", |
| get_khandle_from_ino(inode)); |
| } else { |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "*** making bad inode %pU\n", |
| get_khandle_from_ino(inode)); |
| make_bad_inode(inode); |
| } |
| } |
| |
| /* |
| * The following is a very dirty hack that is now a permanent part of the |
| * ORANGEFS protocol. See protocol.h for more error definitions. |
| */ |
| |
| /* The order matches include/orangefs-types.h in the OrangeFS source. */ |
| static int PINT_errno_mapping[] = { |
| 0, EPERM, ENOENT, EINTR, EIO, ENXIO, EBADF, EAGAIN, ENOMEM, |
| EFAULT, EBUSY, EEXIST, ENODEV, ENOTDIR, EISDIR, EINVAL, EMFILE, |
| EFBIG, ENOSPC, EROFS, EMLINK, EPIPE, EDEADLK, ENAMETOOLONG, |
| ENOLCK, ENOSYS, ENOTEMPTY, ELOOP, EWOULDBLOCK, ENOMSG, EUNATCH, |
| EBADR, EDEADLOCK, ENODATA, ETIME, ENONET, EREMOTE, ECOMM, |
| EPROTO, EBADMSG, EOVERFLOW, ERESTART, EMSGSIZE, EPROTOTYPE, |
| ENOPROTOOPT, EPROTONOSUPPORT, EOPNOTSUPP, EADDRINUSE, |
| EADDRNOTAVAIL, ENETDOWN, ENETUNREACH, ENETRESET, ENOBUFS, |
| ETIMEDOUT, ECONNREFUSED, EHOSTDOWN, EHOSTUNREACH, EALREADY, |
| EACCES, ECONNRESET, ERANGE |
| }; |
| |
| int orangefs_normalize_to_errno(__s32 error_code) |
| { |
| __u32 i; |
| |
| /* Success */ |
| if (error_code == 0) { |
| return 0; |
| /* |
| * This shouldn't ever happen. If it does it should be fixed on the |
| * server. |
| */ |
| } else if (error_code > 0) { |
| gossip_err("orangefs: error status receieved.\n"); |
| gossip_err("orangefs: assuming error code is inverted.\n"); |
| error_code = -error_code; |
| } |
| |
| /* |
| * XXX: This is very bad since error codes from ORANGEFS may not be |
| * suitable for return into userspace. |
| */ |
| |
| /* |
| * Convert ORANGEFS error values into errno values suitable for return |
| * from the kernel. |
| */ |
| if ((-error_code) & ORANGEFS_NON_ERRNO_ERROR_BIT) { |
| if (((-error_code) & |
| (ORANGEFS_ERROR_NUMBER_BITS|ORANGEFS_NON_ERRNO_ERROR_BIT| |
| ORANGEFS_ERROR_BIT)) == ORANGEFS_ECANCEL) { |
| /* |
| * cancellation error codes generally correspond to |
| * a timeout from the client's perspective |
| */ |
| error_code = -ETIMEDOUT; |
| } else { |
| /* assume a default error code */ |
| gossip_err("orangefs: warning: got error code without errno equivalent: %d.\n", error_code); |
| error_code = -EINVAL; |
| } |
| |
| /* Convert ORANGEFS encoded errno values into regular errno values. */ |
| } else if ((-error_code) & ORANGEFS_ERROR_BIT) { |
| i = (-error_code) & ~(ORANGEFS_ERROR_BIT|ORANGEFS_ERROR_CLASS_BITS); |
| if (i < sizeof(PINT_errno_mapping)/sizeof(*PINT_errno_mapping)) |
| error_code = -PINT_errno_mapping[i]; |
| else |
| error_code = -EINVAL; |
| |
| /* |
| * Only ORANGEFS protocol error codes should ever come here. Otherwise |
| * there is a bug somewhere. |
| */ |
| } else { |
| gossip_err("orangefs: orangefs_normalize_to_errno: got error code which is not from ORANGEFS.\n"); |
| } |
| return error_code; |
| } |
| |
| #define NUM_MODES 11 |
| __s32 ORANGEFS_util_translate_mode(int mode) |
| { |
| int ret = 0; |
| int i = 0; |
| static int modes[NUM_MODES] = { |
| S_IXOTH, S_IWOTH, S_IROTH, |
| S_IXGRP, S_IWGRP, S_IRGRP, |
| S_IXUSR, S_IWUSR, S_IRUSR, |
| S_ISGID, S_ISUID |
| }; |
| static int orangefs_modes[NUM_MODES] = { |
| ORANGEFS_O_EXECUTE, ORANGEFS_O_WRITE, ORANGEFS_O_READ, |
| ORANGEFS_G_EXECUTE, ORANGEFS_G_WRITE, ORANGEFS_G_READ, |
| ORANGEFS_U_EXECUTE, ORANGEFS_U_WRITE, ORANGEFS_U_READ, |
| ORANGEFS_G_SGID, ORANGEFS_U_SUID |
| }; |
| |
| for (i = 0; i < NUM_MODES; i++) |
| if (mode & modes[i]) |
| ret |= orangefs_modes[i]; |
| |
| return ret; |
| } |
| #undef NUM_MODES |
| |
| /* |
| * After obtaining a string representation of the client's debug |
| * keywords and their associated masks, this function is called to build an |
| * array of these values. |
| */ |
| int orangefs_prepare_cdm_array(char *debug_array_string) |
| { |
| int i; |
| int rc = -EINVAL; |
| char *cds_head = NULL; |
| char *cds_delimiter = NULL; |
| int keyword_len = 0; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, "%s: start\n", __func__); |
| |
| /* |
| * figure out how many elements the cdm_array needs. |
| */ |
| for (i = 0; i < strlen(debug_array_string); i++) |
| if (debug_array_string[i] == '\n') |
| cdm_element_count++; |
| |
| if (!cdm_element_count) { |
| pr_info("No elements in client debug array string!\n"); |
| goto out; |
| } |
| |
| cdm_array = |
| kzalloc(cdm_element_count * sizeof(struct client_debug_mask), |
| GFP_KERNEL); |
| if (!cdm_array) { |
| pr_info("malloc failed for cdm_array!\n"); |
| rc = -ENOMEM; |
| goto out; |
| } |
| |
| cds_head = debug_array_string; |
| |
| for (i = 0; i < cdm_element_count; i++) { |
| cds_delimiter = strchr(cds_head, '\n'); |
| *cds_delimiter = '\0'; |
| |
| keyword_len = strcspn(cds_head, " "); |
| |
| cdm_array[i].keyword = kzalloc(keyword_len + 1, GFP_KERNEL); |
| if (!cdm_array[i].keyword) { |
| rc = -ENOMEM; |
| goto out; |
| } |
| |
| sscanf(cds_head, |
| "%s %llx %llx", |
| cdm_array[i].keyword, |
| (unsigned long long *)&(cdm_array[i].mask1), |
| (unsigned long long *)&(cdm_array[i].mask2)); |
| |
| if (!strcmp(cdm_array[i].keyword, ORANGEFS_VERBOSE)) |
| client_verbose_index = i; |
| |
| if (!strcmp(cdm_array[i].keyword, ORANGEFS_ALL)) |
| client_all_index = i; |
| |
| cds_head = cds_delimiter + 1; |
| } |
| |
| rc = cdm_element_count; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, "%s: rc:%d:\n", __func__, rc); |
| |
| out: |
| |
| return rc; |
| |
| } |
| |
| /* |
| * /sys/kernel/debug/orangefs/debug-help can be catted to |
| * see all the available kernel and client debug keywords. |
| * |
| * When the kernel boots, we have no idea what keywords the |
| * client supports, nor their associated masks. |
| * |
| * We pass through this function once at boot and stamp a |
| * boilerplate "we don't know" message for the client in the |
| * debug-help file. We pass through here again when the client |
| * starts and then we can fill out the debug-help file fully. |
| * |
| * The client might be restarted any number of times between |
| * reboots, we only build the debug-help file the first time. |
| */ |
| int orangefs_prepare_debugfs_help_string(int at_boot) |
| { |
| int rc = -EINVAL; |
| int i; |
| int byte_count = 0; |
| char *client_title = "Client Debug Keywords:\n"; |
| char *kernel_title = "Kernel Debug Keywords:\n"; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, "%s: start\n", __func__); |
| |
| if (at_boot) { |
| byte_count += strlen(HELP_STRING_UNINITIALIZED); |
| client_title = HELP_STRING_UNINITIALIZED; |
| } else { |
| /* |
| * fill the client keyword/mask array and remember |
| * how many elements there were. |
| */ |
| cdm_element_count = |
| orangefs_prepare_cdm_array(client_debug_array_string); |
| if (cdm_element_count <= 0) |
| goto out; |
| |
| /* Count the bytes destined for debug_help_string. */ |
| byte_count += strlen(client_title); |
| |
| for (i = 0; i < cdm_element_count; i++) { |
| byte_count += strlen(cdm_array[i].keyword + 2); |
| if (byte_count >= DEBUG_HELP_STRING_SIZE) { |
| pr_info("%s: overflow 1!\n", __func__); |
| goto out; |
| } |
| } |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, |
| "%s: cdm_element_count:%d:\n", |
| __func__, |
| cdm_element_count); |
| } |
| |
| byte_count += strlen(kernel_title); |
| for (i = 0; i < num_kmod_keyword_mask_map; i++) { |
| byte_count += |
| strlen(s_kmod_keyword_mask_map[i].keyword + 2); |
| if (byte_count >= DEBUG_HELP_STRING_SIZE) { |
| pr_info("%s: overflow 2!\n", __func__); |
| goto out; |
| } |
| } |
| |
| /* build debug_help_string. */ |
| debug_help_string = kzalloc(DEBUG_HELP_STRING_SIZE, GFP_KERNEL); |
| if (!debug_help_string) { |
| rc = -ENOMEM; |
| goto out; |
| } |
| |
| strcat(debug_help_string, client_title); |
| |
| if (!at_boot) { |
| for (i = 0; i < cdm_element_count; i++) { |
| strcat(debug_help_string, "\t"); |
| strcat(debug_help_string, cdm_array[i].keyword); |
| strcat(debug_help_string, "\n"); |
| } |
| } |
| |
| strcat(debug_help_string, "\n"); |
| strcat(debug_help_string, kernel_title); |
| |
| for (i = 0; i < num_kmod_keyword_mask_map; i++) { |
| strcat(debug_help_string, "\t"); |
| strcat(debug_help_string, s_kmod_keyword_mask_map[i].keyword); |
| strcat(debug_help_string, "\n"); |
| } |
| |
| rc = 0; |
| |
| out: |
| |
| return rc; |
| |
| } |
| |
| /* |
| * kernel = type 0 |
| * client = type 1 |
| */ |
| void debug_mask_to_string(void *mask, int type) |
| { |
| int i; |
| int len = 0; |
| char *debug_string; |
| int element_count = 0; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, "%s: start\n", __func__); |
| |
| if (type) { |
| debug_string = client_debug_string; |
| element_count = cdm_element_count; |
| } else { |
| debug_string = kernel_debug_string; |
| element_count = num_kmod_keyword_mask_map; |
| } |
| |
| memset(debug_string, 0, ORANGEFS_MAX_DEBUG_STRING_LEN); |
| |
| /* |
| * Some keywords, like "all" or "verbose", are amalgams of |
| * numerous other keywords. Make a special check for those |
| * before grinding through the whole mask only to find out |
| * later... |
| */ |
| if (check_amalgam_keyword(mask, type)) |
| goto out; |
| |
| /* Build the debug string. */ |
| for (i = 0; i < element_count; i++) |
| if (type) |
| do_c_string(mask, i); |
| else |
| do_k_string(mask, i); |
| |
| len = strlen(debug_string); |
| |
| if ((len) && (type)) |
| client_debug_string[len - 1] = '\0'; |
| else if (len) |
| kernel_debug_string[len - 1] = '\0'; |
| else if (type) |
| strcpy(client_debug_string, "none"); |
| else |
| strcpy(kernel_debug_string, "none"); |
| |
| out: |
| gossip_debug(GOSSIP_UTILS_DEBUG, "%s: string:%s:\n", __func__, debug_string); |
| |
| return; |
| |
| } |
| |
| void do_k_string(void *k_mask, int index) |
| { |
| __u64 *mask = (__u64 *) k_mask; |
| |
| if (keyword_is_amalgam((char *) s_kmod_keyword_mask_map[index].keyword)) |
| goto out; |
| |
| if (*mask & s_kmod_keyword_mask_map[index].mask_val) { |
| if ((strlen(kernel_debug_string) + |
| strlen(s_kmod_keyword_mask_map[index].keyword)) |
| < ORANGEFS_MAX_DEBUG_STRING_LEN - 1) { |
| strcat(kernel_debug_string, |
| s_kmod_keyword_mask_map[index].keyword); |
| strcat(kernel_debug_string, ","); |
| } else { |
| gossip_err("%s: overflow!\n", __func__); |
| strcpy(kernel_debug_string, ORANGEFS_ALL); |
| goto out; |
| } |
| } |
| |
| out: |
| |
| return; |
| } |
| |
| void do_c_string(void *c_mask, int index) |
| { |
| struct client_debug_mask *mask = (struct client_debug_mask *) c_mask; |
| |
| if (keyword_is_amalgam(cdm_array[index].keyword)) |
| goto out; |
| |
| if ((mask->mask1 & cdm_array[index].mask1) || |
| (mask->mask2 & cdm_array[index].mask2)) { |
| if ((strlen(client_debug_string) + |
| strlen(cdm_array[index].keyword) + 1) |
| < ORANGEFS_MAX_DEBUG_STRING_LEN - 2) { |
| strcat(client_debug_string, |
| cdm_array[index].keyword); |
| strcat(client_debug_string, ","); |
| } else { |
| gossip_err("%s: overflow!\n", __func__); |
| strcpy(client_debug_string, ORANGEFS_ALL); |
| goto out; |
| } |
| } |
| out: |
| return; |
| } |
| |
| int keyword_is_amalgam(char *keyword) |
| { |
| int rc = 0; |
| |
| if ((!strcmp(keyword, ORANGEFS_ALL)) || (!strcmp(keyword, ORANGEFS_VERBOSE))) |
| rc = 1; |
| |
| return rc; |
| } |
| |
| /* |
| * kernel = type 0 |
| * client = type 1 |
| * |
| * return 1 if we found an amalgam. |
| */ |
| int check_amalgam_keyword(void *mask, int type) |
| { |
| __u64 *k_mask; |
| struct client_debug_mask *c_mask; |
| int k_all_index = num_kmod_keyword_mask_map - 1; |
| int rc = 0; |
| |
| if (type) { |
| c_mask = (struct client_debug_mask *) mask; |
| |
| if ((c_mask->mask1 == cdm_array[client_all_index].mask1) && |
| (c_mask->mask2 == cdm_array[client_all_index].mask2)) { |
| strcpy(client_debug_string, ORANGEFS_ALL); |
| rc = 1; |
| goto out; |
| } |
| |
| if ((c_mask->mask1 == cdm_array[client_verbose_index].mask1) && |
| (c_mask->mask2 == cdm_array[client_verbose_index].mask2)) { |
| strcpy(client_debug_string, ORANGEFS_VERBOSE); |
| rc = 1; |
| goto out; |
| } |
| |
| } else { |
| k_mask = (__u64 *) mask; |
| |
| if (*k_mask >= s_kmod_keyword_mask_map[k_all_index].mask_val) { |
| strcpy(kernel_debug_string, ORANGEFS_ALL); |
| rc = 1; |
| goto out; |
| } |
| } |
| |
| out: |
| |
| return rc; |
| } |
| |
| /* |
| * kernel = type 0 |
| * client = type 1 |
| */ |
| void debug_string_to_mask(char *debug_string, void *mask, int type) |
| { |
| char *unchecked_keyword; |
| int i; |
| char *strsep_fodder = kstrdup(debug_string, GFP_KERNEL); |
| char *original_pointer; |
| int element_count = 0; |
| struct client_debug_mask *c_mask; |
| __u64 *k_mask; |
| |
| gossip_debug(GOSSIP_UTILS_DEBUG, "%s: start\n", __func__); |
| |
| if (type) { |
| c_mask = (struct client_debug_mask *)mask; |
| element_count = cdm_element_count; |
| } else { |
| k_mask = (__u64 *)mask; |
| *k_mask = 0; |
| element_count = num_kmod_keyword_mask_map; |
| } |
| |
| original_pointer = strsep_fodder; |
| while ((unchecked_keyword = strsep(&strsep_fodder, ","))) |
| if (strlen(unchecked_keyword)) { |
| for (i = 0; i < element_count; i++) |
| if (type) |
| do_c_mask(i, |
| unchecked_keyword, |
| &c_mask); |
| else |
| do_k_mask(i, |
| unchecked_keyword, |
| &k_mask); |
| } |
| |
| kfree(original_pointer); |
| } |
| |
| void do_c_mask(int i, |
| char *unchecked_keyword, |
| struct client_debug_mask **sane_mask) |
| { |
| |
| if (!strcmp(cdm_array[i].keyword, unchecked_keyword)) { |
| (**sane_mask).mask1 = (**sane_mask).mask1 | cdm_array[i].mask1; |
| (**sane_mask).mask2 = (**sane_mask).mask2 | cdm_array[i].mask2; |
| } |
| } |
| |
| void do_k_mask(int i, char *unchecked_keyword, __u64 **sane_mask) |
| { |
| |
| if (!strcmp(s_kmod_keyword_mask_map[i].keyword, unchecked_keyword)) |
| **sane_mask = (**sane_mask) | |
| s_kmod_keyword_mask_map[i].mask_val; |
| } |