| /* |
| * GPL HEADER START |
| * |
| * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
| * |
| * This program is free software; you can redistribute it and/or modify |
| * it under the terms of the GNU General Public License version 2 only, |
| * as published by the Free Software Foundation. |
| * |
| * This program is distributed in the hope that it will be useful, but |
| * WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * General Public License version 2 for more details (a copy is included |
| * in the LICENSE file that accompanied this code). |
| * |
| * You should have received a copy of the GNU General Public License |
| * version 2 along with this program; If not, see |
| * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf |
| * |
| * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara, |
| * CA 95054 USA or visit www.sun.com if you need additional information or |
| * have any questions. |
| * |
| * GPL HEADER END |
| */ |
| /* |
| * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved. |
| * Use is subject to license terms. |
| * |
| * Copyright (c) 2011, 2015, Intel Corporation. |
| */ |
| /* |
| * This file is part of Lustre, http://www.lustre.org/ |
| * Lustre is a trademark of Sun Microsystems, Inc. |
| * |
| * Implementation of cl_io for LOV layer. |
| * |
| * Author: Nikita Danilov <nikita.danilov@sun.com> |
| * Author: Jinshan Xiong <jinshan.xiong@whamcloud.com> |
| */ |
| |
| #define DEBUG_SUBSYSTEM S_LOV |
| |
| #include "lov_cl_internal.h" |
| |
| /** \addtogroup lov |
| * @{ |
| */ |
| |
| static inline void lov_sub_enter(struct lov_io_sub *sub) |
| { |
| sub->sub_reenter++; |
| } |
| |
| static inline void lov_sub_exit(struct lov_io_sub *sub) |
| { |
| sub->sub_reenter--; |
| } |
| |
| static void lov_io_sub_fini(const struct lu_env *env, struct lov_io *lio, |
| struct lov_io_sub *sub) |
| { |
| if (sub->sub_io) { |
| if (sub->sub_io_initialized) { |
| lov_sub_enter(sub); |
| cl_io_fini(sub->sub_env, sub->sub_io); |
| lov_sub_exit(sub); |
| sub->sub_io_initialized = 0; |
| lio->lis_active_subios--; |
| } |
| if (sub->sub_stripe == lio->lis_single_subio_index) |
| lio->lis_single_subio_index = -1; |
| else if (!sub->sub_borrowed) |
| kfree(sub->sub_io); |
| sub->sub_io = NULL; |
| } |
| if (!IS_ERR_OR_NULL(sub->sub_env)) { |
| if (!sub->sub_borrowed) |
| cl_env_put(sub->sub_env, &sub->sub_refcheck); |
| sub->sub_env = NULL; |
| } |
| } |
| |
| static void lov_io_sub_inherit(struct cl_io *io, struct lov_io *lio, |
| int stripe, loff_t start, loff_t end) |
| { |
| struct lov_stripe_md *lsm = lio->lis_object->lo_lsm; |
| struct cl_io *parent = lio->lis_cl.cis_io; |
| |
| switch (io->ci_type) { |
| case CIT_SETATTR: { |
| io->u.ci_setattr.sa_attr = parent->u.ci_setattr.sa_attr; |
| io->u.ci_setattr.sa_valid = parent->u.ci_setattr.sa_valid; |
| if (cl_io_is_trunc(io)) { |
| loff_t new_size = parent->u.ci_setattr.sa_attr.lvb_size; |
| |
| new_size = lov_size_to_stripe(lsm, new_size, stripe); |
| io->u.ci_setattr.sa_attr.lvb_size = new_size; |
| } |
| break; |
| } |
| case CIT_FAULT: { |
| struct cl_object *obj = parent->ci_obj; |
| loff_t off = cl_offset(obj, parent->u.ci_fault.ft_index); |
| |
| io->u.ci_fault = parent->u.ci_fault; |
| off = lov_size_to_stripe(lsm, off, stripe); |
| io->u.ci_fault.ft_index = cl_index(obj, off); |
| break; |
| } |
| case CIT_FSYNC: { |
| io->u.ci_fsync.fi_start = start; |
| io->u.ci_fsync.fi_end = end; |
| io->u.ci_fsync.fi_fid = parent->u.ci_fsync.fi_fid; |
| io->u.ci_fsync.fi_mode = parent->u.ci_fsync.fi_mode; |
| break; |
| } |
| case CIT_READ: |
| case CIT_WRITE: { |
| io->u.ci_wr.wr_sync = cl_io_is_sync_write(parent); |
| if (cl_io_is_append(parent)) { |
| io->u.ci_wr.wr_append = 1; |
| } else { |
| io->u.ci_rw.crw_pos = start; |
| io->u.ci_rw.crw_count = end - start; |
| } |
| break; |
| } |
| default: |
| break; |
| } |
| } |
| |
| static int lov_io_sub_init(const struct lu_env *env, struct lov_io *lio, |
| struct lov_io_sub *sub) |
| { |
| struct lov_object *lov = lio->lis_object; |
| struct lov_device *ld = lu2lov_dev(lov2cl(lov)->co_lu.lo_dev); |
| struct cl_io *sub_io; |
| struct cl_object *sub_obj; |
| struct cl_io *io = lio->lis_cl.cis_io; |
| |
| int stripe = sub->sub_stripe; |
| int result; |
| |
| LASSERT(!sub->sub_io); |
| LASSERT(!sub->sub_env); |
| LASSERT(sub->sub_stripe < lio->lis_stripe_count); |
| |
| if (unlikely(!lov_r0(lov)->lo_sub[stripe])) |
| return -EIO; |
| |
| result = 0; |
| sub->sub_io_initialized = 0; |
| sub->sub_borrowed = 0; |
| |
| if (lio->lis_mem_frozen) { |
| LASSERT(mutex_is_locked(&ld->ld_mutex)); |
| sub->sub_io = &ld->ld_emrg[stripe]->emrg_subio; |
| sub->sub_env = ld->ld_emrg[stripe]->emrg_env; |
| sub->sub_borrowed = 1; |
| } else { |
| void *cookie; |
| |
| /* obtain new environment */ |
| cookie = cl_env_reenter(); |
| sub->sub_env = cl_env_get(&sub->sub_refcheck); |
| cl_env_reexit(cookie); |
| if (IS_ERR(sub->sub_env)) |
| result = PTR_ERR(sub->sub_env); |
| |
| if (result == 0) { |
| /* |
| * First sub-io. Use ->lis_single_subio to |
| * avoid dynamic allocation. |
| */ |
| if (lio->lis_active_subios == 0) { |
| sub->sub_io = &lio->lis_single_subio; |
| lio->lis_single_subio_index = stripe; |
| } else { |
| sub->sub_io = kzalloc(sizeof(*sub->sub_io), |
| GFP_NOFS); |
| if (!sub->sub_io) |
| result = -ENOMEM; |
| } |
| } |
| } |
| |
| if (result == 0) { |
| sub_obj = lovsub2cl(lov_r0(lov)->lo_sub[stripe]); |
| sub_io = sub->sub_io; |
| |
| sub_io->ci_obj = sub_obj; |
| sub_io->ci_result = 0; |
| |
| sub_io->ci_parent = io; |
| sub_io->ci_lockreq = io->ci_lockreq; |
| sub_io->ci_type = io->ci_type; |
| sub_io->ci_no_srvlock = io->ci_no_srvlock; |
| sub_io->ci_noatime = io->ci_noatime; |
| |
| lov_sub_enter(sub); |
| result = cl_io_sub_init(sub->sub_env, sub_io, |
| io->ci_type, sub_obj); |
| lov_sub_exit(sub); |
| if (result >= 0) { |
| lio->lis_active_subios++; |
| sub->sub_io_initialized = 1; |
| result = 0; |
| } |
| } |
| if (result != 0) |
| lov_io_sub_fini(env, lio, sub); |
| return result; |
| } |
| |
| struct lov_io_sub *lov_sub_get(const struct lu_env *env, |
| struct lov_io *lio, int stripe) |
| { |
| int rc; |
| struct lov_io_sub *sub = &lio->lis_subs[stripe]; |
| |
| LASSERT(stripe < lio->lis_stripe_count); |
| |
| if (!sub->sub_io_initialized) { |
| sub->sub_stripe = stripe; |
| rc = lov_io_sub_init(env, lio, sub); |
| } else { |
| rc = 0; |
| } |
| if (rc == 0) |
| lov_sub_enter(sub); |
| else |
| sub = ERR_PTR(rc); |
| return sub; |
| } |
| |
| void lov_sub_put(struct lov_io_sub *sub) |
| { |
| lov_sub_exit(sub); |
| } |
| |
| /***************************************************************************** |
| * |
| * Lov io operations. |
| * |
| */ |
| |
| int lov_page_stripe(const struct cl_page *page) |
| { |
| struct lovsub_object *subobj; |
| const struct cl_page_slice *slice; |
| |
| slice = cl_page_at(page, &lovsub_device_type); |
| LASSERT(slice->cpl_obj); |
| |
| subobj = cl2lovsub(slice->cpl_obj); |
| return subobj->lso_index; |
| } |
| |
| struct lov_io_sub *lov_page_subio(const struct lu_env *env, struct lov_io *lio, |
| const struct cl_page_slice *slice) |
| { |
| struct lov_stripe_md *lsm = lio->lis_object->lo_lsm; |
| struct cl_page *page = slice->cpl_page; |
| int stripe; |
| |
| LASSERT(lio->lis_cl.cis_io); |
| LASSERT(cl2lov(slice->cpl_obj) == lio->lis_object); |
| LASSERT(lsm); |
| LASSERT(lio->lis_nr_subios > 0); |
| |
| stripe = lov_page_stripe(page); |
| return lov_sub_get(env, lio, stripe); |
| } |
| |
| static int lov_io_subio_init(const struct lu_env *env, struct lov_io *lio, |
| struct cl_io *io) |
| { |
| struct lov_stripe_md *lsm; |
| int result; |
| |
| LASSERT(lio->lis_object); |
| lsm = lio->lis_object->lo_lsm; |
| |
| /* |
| * Need to be optimized, we can't afford to allocate a piece of memory |
| * when writing a page. -jay |
| */ |
| lio->lis_subs = |
| libcfs_kvzalloc(lsm->lsm_stripe_count * |
| sizeof(lio->lis_subs[0]), |
| GFP_NOFS); |
| if (lio->lis_subs) { |
| lio->lis_nr_subios = lio->lis_stripe_count; |
| lio->lis_single_subio_index = -1; |
| lio->lis_active_subios = 0; |
| result = 0; |
| } else { |
| result = -ENOMEM; |
| } |
| return result; |
| } |
| |
| static void lov_io_slice_init(struct lov_io *lio, |
| struct lov_object *obj, struct cl_io *io) |
| { |
| io->ci_result = 0; |
| lio->lis_object = obj; |
| |
| lio->lis_stripe_count = obj->lo_lsm->lsm_stripe_count; |
| |
| switch (io->ci_type) { |
| case CIT_READ: |
| case CIT_WRITE: |
| lio->lis_pos = io->u.ci_rw.crw_pos; |
| lio->lis_endpos = io->u.ci_rw.crw_pos + io->u.ci_rw.crw_count; |
| lio->lis_io_endpos = lio->lis_endpos; |
| if (cl_io_is_append(io)) { |
| LASSERT(io->ci_type == CIT_WRITE); |
| lio->lis_pos = 0; |
| lio->lis_endpos = OBD_OBJECT_EOF; |
| } |
| break; |
| |
| case CIT_SETATTR: |
| if (cl_io_is_trunc(io)) |
| lio->lis_pos = io->u.ci_setattr.sa_attr.lvb_size; |
| else |
| lio->lis_pos = 0; |
| lio->lis_endpos = OBD_OBJECT_EOF; |
| break; |
| |
| case CIT_FAULT: { |
| pgoff_t index = io->u.ci_fault.ft_index; |
| |
| lio->lis_pos = cl_offset(io->ci_obj, index); |
| lio->lis_endpos = cl_offset(io->ci_obj, index + 1); |
| break; |
| } |
| |
| case CIT_FSYNC: { |
| lio->lis_pos = io->u.ci_fsync.fi_start; |
| lio->lis_endpos = io->u.ci_fsync.fi_end; |
| break; |
| } |
| |
| case CIT_MISC: |
| lio->lis_pos = 0; |
| lio->lis_endpos = OBD_OBJECT_EOF; |
| break; |
| |
| default: |
| LBUG(); |
| } |
| } |
| |
| static void lov_io_fini(const struct lu_env *env, const struct cl_io_slice *ios) |
| { |
| struct lov_io *lio = cl2lov_io(env, ios); |
| struct lov_object *lov = cl2lov(ios->cis_obj); |
| int i; |
| |
| if (lio->lis_subs) { |
| for (i = 0; i < lio->lis_nr_subios; i++) |
| lov_io_sub_fini(env, lio, &lio->lis_subs[i]); |
| kvfree(lio->lis_subs); |
| lio->lis_nr_subios = 0; |
| } |
| |
| LASSERT(atomic_read(&lov->lo_active_ios) > 0); |
| if (atomic_dec_and_test(&lov->lo_active_ios)) |
| wake_up_all(&lov->lo_waitq); |
| } |
| |
| static u64 lov_offset_mod(u64 val, int delta) |
| { |
| if (val != OBD_OBJECT_EOF) |
| val += delta; |
| return val; |
| } |
| |
| static int lov_io_iter_init(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| struct lov_io *lio = cl2lov_io(env, ios); |
| struct lov_stripe_md *lsm = lio->lis_object->lo_lsm; |
| struct lov_io_sub *sub; |
| u64 endpos; |
| u64 start; |
| u64 end; |
| int stripe; |
| int rc = 0; |
| |
| endpos = lov_offset_mod(lio->lis_endpos, -1); |
| for (stripe = 0; stripe < lio->lis_stripe_count; stripe++) { |
| if (!lov_stripe_intersects(lsm, stripe, lio->lis_pos, |
| endpos, &start, &end)) |
| continue; |
| |
| if (unlikely(!lov_r0(lio->lis_object)->lo_sub[stripe])) { |
| if (ios->cis_io->ci_type == CIT_READ || |
| ios->cis_io->ci_type == CIT_WRITE || |
| ios->cis_io->ci_type == CIT_FAULT) |
| return -EIO; |
| |
| continue; |
| } |
| |
| end = lov_offset_mod(end, 1); |
| sub = lov_sub_get(env, lio, stripe); |
| if (!IS_ERR(sub)) { |
| lov_io_sub_inherit(sub->sub_io, lio, stripe, |
| start, end); |
| rc = cl_io_iter_init(sub->sub_env, sub->sub_io); |
| lov_sub_put(sub); |
| CDEBUG(D_VFSTRACE, "shrink: %d [%llu, %llu)\n", |
| stripe, start, end); |
| } else { |
| rc = PTR_ERR(sub); |
| } |
| |
| if (!rc) |
| list_add_tail(&sub->sub_linkage, &lio->lis_active); |
| else |
| break; |
| } |
| return rc; |
| } |
| |
| static int lov_io_rw_iter_init(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| struct lov_io *lio = cl2lov_io(env, ios); |
| struct cl_io *io = ios->cis_io; |
| struct lov_stripe_md *lsm = lio->lis_object->lo_lsm; |
| __u64 start = io->u.ci_rw.crw_pos; |
| loff_t next; |
| unsigned long ssize = lsm->lsm_stripe_size; |
| |
| LASSERT(io->ci_type == CIT_READ || io->ci_type == CIT_WRITE); |
| |
| /* fast path for common case. */ |
| if (lio->lis_nr_subios != 1 && !cl_io_is_append(io)) { |
| lov_do_div64(start, ssize); |
| next = (start + 1) * ssize; |
| if (next <= start * ssize) |
| next = ~0ull; |
| |
| io->ci_continue = next < lio->lis_io_endpos; |
| io->u.ci_rw.crw_count = min_t(loff_t, lio->lis_io_endpos, |
| next) - io->u.ci_rw.crw_pos; |
| lio->lis_pos = io->u.ci_rw.crw_pos; |
| lio->lis_endpos = io->u.ci_rw.crw_pos + io->u.ci_rw.crw_count; |
| CDEBUG(D_VFSTRACE, "stripe: %llu chunk: [%llu, %llu) %llu\n", |
| (__u64)start, lio->lis_pos, lio->lis_endpos, |
| (__u64)lio->lis_io_endpos); |
| } |
| /* |
| * XXX The following call should be optimized: we know, that |
| * [lio->lis_pos, lio->lis_endpos) intersects with exactly one stripe. |
| */ |
| return lov_io_iter_init(env, ios); |
| } |
| |
| static int lov_io_call(const struct lu_env *env, struct lov_io *lio, |
| int (*iofunc)(const struct lu_env *, struct cl_io *)) |
| { |
| struct cl_io *parent = lio->lis_cl.cis_io; |
| struct lov_io_sub *sub; |
| int rc = 0; |
| |
| list_for_each_entry(sub, &lio->lis_active, sub_linkage) { |
| lov_sub_enter(sub); |
| rc = iofunc(sub->sub_env, sub->sub_io); |
| lov_sub_exit(sub); |
| if (rc) |
| break; |
| |
| if (parent->ci_result == 0) |
| parent->ci_result = sub->sub_io->ci_result; |
| } |
| return rc; |
| } |
| |
| static int lov_io_lock(const struct lu_env *env, const struct cl_io_slice *ios) |
| { |
| return lov_io_call(env, cl2lov_io(env, ios), cl_io_lock); |
| } |
| |
| static int lov_io_start(const struct lu_env *env, const struct cl_io_slice *ios) |
| { |
| return lov_io_call(env, cl2lov_io(env, ios), cl_io_start); |
| } |
| |
| static int lov_io_end_wrapper(const struct lu_env *env, struct cl_io *io) |
| { |
| /* |
| * It's possible that lov_io_start() wasn't called against this |
| * sub-io, either because previous sub-io failed, or upper layer |
| * completed IO. |
| */ |
| if (io->ci_state == CIS_IO_GOING) |
| cl_io_end(env, io); |
| else |
| io->ci_state = CIS_IO_FINISHED; |
| return 0; |
| } |
| |
| static int lov_io_iter_fini_wrapper(const struct lu_env *env, struct cl_io *io) |
| { |
| cl_io_iter_fini(env, io); |
| return 0; |
| } |
| |
| static int lov_io_unlock_wrapper(const struct lu_env *env, struct cl_io *io) |
| { |
| cl_io_unlock(env, io); |
| return 0; |
| } |
| |
| static void lov_io_end(const struct lu_env *env, const struct cl_io_slice *ios) |
| { |
| int rc; |
| |
| rc = lov_io_call(env, cl2lov_io(env, ios), lov_io_end_wrapper); |
| LASSERT(rc == 0); |
| } |
| |
| static void lov_io_iter_fini(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| struct lov_io *lio = cl2lov_io(env, ios); |
| int rc; |
| |
| rc = lov_io_call(env, lio, lov_io_iter_fini_wrapper); |
| LASSERT(rc == 0); |
| while (!list_empty(&lio->lis_active)) |
| list_del_init(lio->lis_active.next); |
| } |
| |
| static void lov_io_unlock(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| int rc; |
| |
| rc = lov_io_call(env, cl2lov_io(env, ios), lov_io_unlock_wrapper); |
| LASSERT(rc == 0); |
| } |
| |
| /** |
| * lov implementation of cl_operations::cio_submit() method. It takes a list |
| * of pages in \a queue, splits it into per-stripe sub-lists, invokes |
| * cl_io_submit() on underlying devices to submit sub-lists, and then splices |
| * everything back. |
| * |
| * Major complication of this function is a need to handle memory cleansing: |
| * cl_io_submit() is called to write out pages as a part of VM memory |
| * reclamation, and hence it may not fail due to memory shortages (system |
| * dead-locks otherwise). To deal with this, some resources (sub-lists, |
| * sub-environment, etc.) are allocated per-device on "startup" (i.e., in a |
| * not-memory cleansing context), and in case of memory shortage, these |
| * pre-allocated resources are used by lov_io_submit() under |
| * lov_device::ld_mutex mutex. |
| */ |
| static int lov_io_submit(const struct lu_env *env, |
| const struct cl_io_slice *ios, |
| enum cl_req_type crt, struct cl_2queue *queue) |
| { |
| struct cl_page_list *qin = &queue->c2_qin; |
| struct lov_io *lio = cl2lov_io(env, ios); |
| struct lov_io_sub *sub; |
| struct cl_page_list *plist = &lov_env_info(env)->lti_plist; |
| struct cl_page *page; |
| int stripe; |
| |
| int rc = 0; |
| |
| if (lio->lis_active_subios == 1) { |
| int idx = lio->lis_single_subio_index; |
| |
| LASSERT(idx < lio->lis_nr_subios); |
| sub = lov_sub_get(env, lio, idx); |
| LASSERT(!IS_ERR(sub)); |
| LASSERT(sub->sub_io == &lio->lis_single_subio); |
| rc = cl_io_submit_rw(sub->sub_env, sub->sub_io, |
| crt, queue); |
| lov_sub_put(sub); |
| return rc; |
| } |
| |
| LASSERT(lio->lis_subs); |
| |
| cl_page_list_init(plist); |
| while (qin->pl_nr > 0) { |
| struct cl_2queue *cl2q = &lov_env_info(env)->lti_cl2q; |
| |
| cl_2queue_init(cl2q); |
| |
| page = cl_page_list_first(qin); |
| cl_page_list_move(&cl2q->c2_qin, qin, page); |
| |
| stripe = lov_page_stripe(page); |
| while (qin->pl_nr > 0) { |
| page = cl_page_list_first(qin); |
| if (stripe != lov_page_stripe(page)) |
| break; |
| |
| cl_page_list_move(&cl2q->c2_qin, qin, page); |
| } |
| |
| sub = lov_sub_get(env, lio, stripe); |
| if (!IS_ERR(sub)) { |
| rc = cl_io_submit_rw(sub->sub_env, sub->sub_io, |
| crt, cl2q); |
| lov_sub_put(sub); |
| } else { |
| rc = PTR_ERR(sub); |
| } |
| |
| cl_page_list_splice(&cl2q->c2_qin, plist); |
| cl_page_list_splice(&cl2q->c2_qout, &queue->c2_qout); |
| cl_2queue_fini(env, cl2q); |
| |
| if (rc != 0) |
| break; |
| } |
| |
| cl_page_list_splice(plist, qin); |
| cl_page_list_fini(env, plist); |
| |
| return rc; |
| } |
| |
| static int lov_io_commit_async(const struct lu_env *env, |
| const struct cl_io_slice *ios, |
| struct cl_page_list *queue, int from, int to, |
| cl_commit_cbt cb) |
| { |
| struct cl_page_list *plist = &lov_env_info(env)->lti_plist; |
| struct lov_io *lio = cl2lov_io(env, ios); |
| struct lov_io_sub *sub; |
| struct cl_page *page; |
| int rc = 0; |
| |
| if (lio->lis_active_subios == 1) { |
| int idx = lio->lis_single_subio_index; |
| |
| LASSERT(idx < lio->lis_nr_subios); |
| sub = lov_sub_get(env, lio, idx); |
| LASSERT(!IS_ERR(sub)); |
| LASSERT(sub->sub_io == &lio->lis_single_subio); |
| rc = cl_io_commit_async(sub->sub_env, sub->sub_io, queue, |
| from, to, cb); |
| lov_sub_put(sub); |
| return rc; |
| } |
| |
| LASSERT(lio->lis_subs); |
| |
| cl_page_list_init(plist); |
| while (queue->pl_nr > 0) { |
| int stripe_to = to; |
| int stripe; |
| |
| LASSERT(plist->pl_nr == 0); |
| page = cl_page_list_first(queue); |
| cl_page_list_move(plist, queue, page); |
| |
| stripe = lov_page_stripe(page); |
| while (queue->pl_nr > 0) { |
| page = cl_page_list_first(queue); |
| if (stripe != lov_page_stripe(page)) |
| break; |
| |
| cl_page_list_move(plist, queue, page); |
| } |
| |
| if (queue->pl_nr > 0) /* still has more pages */ |
| stripe_to = PAGE_SIZE; |
| |
| sub = lov_sub_get(env, lio, stripe); |
| if (!IS_ERR(sub)) { |
| rc = cl_io_commit_async(sub->sub_env, sub->sub_io, |
| plist, from, stripe_to, cb); |
| lov_sub_put(sub); |
| } else { |
| rc = PTR_ERR(sub); |
| break; |
| } |
| |
| if (plist->pl_nr > 0) /* short write */ |
| break; |
| |
| from = 0; |
| } |
| |
| /* for error case, add the page back into the qin list */ |
| LASSERT(ergo(rc == 0, plist->pl_nr == 0)); |
| while (plist->pl_nr > 0) { |
| /* error occurred, add the uncommitted pages back into queue */ |
| page = cl_page_list_last(plist); |
| cl_page_list_move_head(queue, plist, page); |
| } |
| |
| return rc; |
| } |
| |
| static int lov_io_fault_start(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| struct cl_fault_io *fio; |
| struct lov_io *lio; |
| struct lov_io_sub *sub; |
| |
| fio = &ios->cis_io->u.ci_fault; |
| lio = cl2lov_io(env, ios); |
| sub = lov_sub_get(env, lio, lov_page_stripe(fio->ft_page)); |
| if (IS_ERR(sub)) |
| return PTR_ERR(sub); |
| sub->sub_io->u.ci_fault.ft_nob = fio->ft_nob; |
| lov_sub_put(sub); |
| return lov_io_start(env, ios); |
| } |
| |
| static void lov_io_fsync_end(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| struct lov_io *lio = cl2lov_io(env, ios); |
| struct lov_io_sub *sub; |
| unsigned int *written = &ios->cis_io->u.ci_fsync.fi_nr_written; |
| |
| *written = 0; |
| list_for_each_entry(sub, &lio->lis_active, sub_linkage) { |
| struct cl_io *subio = sub->sub_io; |
| |
| lov_sub_enter(sub); |
| lov_io_end_wrapper(sub->sub_env, subio); |
| lov_sub_exit(sub); |
| |
| if (subio->ci_result == 0) |
| *written += subio->u.ci_fsync.fi_nr_written; |
| } |
| } |
| |
| static const struct cl_io_operations lov_io_ops = { |
| .op = { |
| [CIT_READ] = { |
| .cio_fini = lov_io_fini, |
| .cio_iter_init = lov_io_rw_iter_init, |
| .cio_iter_fini = lov_io_iter_fini, |
| .cio_lock = lov_io_lock, |
| .cio_unlock = lov_io_unlock, |
| .cio_start = lov_io_start, |
| .cio_end = lov_io_end |
| }, |
| [CIT_WRITE] = { |
| .cio_fini = lov_io_fini, |
| .cio_iter_init = lov_io_rw_iter_init, |
| .cio_iter_fini = lov_io_iter_fini, |
| .cio_lock = lov_io_lock, |
| .cio_unlock = lov_io_unlock, |
| .cio_start = lov_io_start, |
| .cio_end = lov_io_end |
| }, |
| [CIT_SETATTR] = { |
| .cio_fini = lov_io_fini, |
| .cio_iter_init = lov_io_iter_init, |
| .cio_iter_fini = lov_io_iter_fini, |
| .cio_lock = lov_io_lock, |
| .cio_unlock = lov_io_unlock, |
| .cio_start = lov_io_start, |
| .cio_end = lov_io_end |
| }, |
| [CIT_FAULT] = { |
| .cio_fini = lov_io_fini, |
| .cio_iter_init = lov_io_iter_init, |
| .cio_iter_fini = lov_io_iter_fini, |
| .cio_lock = lov_io_lock, |
| .cio_unlock = lov_io_unlock, |
| .cio_start = lov_io_fault_start, |
| .cio_end = lov_io_end |
| }, |
| [CIT_FSYNC] = { |
| .cio_fini = lov_io_fini, |
| .cio_iter_init = lov_io_iter_init, |
| .cio_iter_fini = lov_io_iter_fini, |
| .cio_lock = lov_io_lock, |
| .cio_unlock = lov_io_unlock, |
| .cio_start = lov_io_start, |
| .cio_end = lov_io_fsync_end |
| }, |
| [CIT_MISC] = { |
| .cio_fini = lov_io_fini |
| } |
| }, |
| .cio_submit = lov_io_submit, |
| .cio_commit_async = lov_io_commit_async, |
| }; |
| |
| /***************************************************************************** |
| * |
| * Empty lov io operations. |
| * |
| */ |
| |
| static void lov_empty_io_fini(const struct lu_env *env, |
| const struct cl_io_slice *ios) |
| { |
| struct lov_object *lov = cl2lov(ios->cis_obj); |
| |
| if (atomic_dec_and_test(&lov->lo_active_ios)) |
| wake_up_all(&lov->lo_waitq); |
| } |
| |
| static void lov_empty_impossible(const struct lu_env *env, |
| struct cl_io_slice *ios) |
| { |
| LBUG(); |
| } |
| |
| #define LOV_EMPTY_IMPOSSIBLE ((void *)lov_empty_impossible) |
| |
| /** |
| * An io operation vector for files without stripes. |
| */ |
| static const struct cl_io_operations lov_empty_io_ops = { |
| .op = { |
| [CIT_READ] = { |
| .cio_fini = lov_empty_io_fini, |
| #if 0 |
| .cio_iter_init = LOV_EMPTY_IMPOSSIBLE, |
| .cio_lock = LOV_EMPTY_IMPOSSIBLE, |
| .cio_start = LOV_EMPTY_IMPOSSIBLE, |
| .cio_end = LOV_EMPTY_IMPOSSIBLE |
| #endif |
| }, |
| [CIT_WRITE] = { |
| .cio_fini = lov_empty_io_fini, |
| .cio_iter_init = LOV_EMPTY_IMPOSSIBLE, |
| .cio_lock = LOV_EMPTY_IMPOSSIBLE, |
| .cio_start = LOV_EMPTY_IMPOSSIBLE, |
| .cio_end = LOV_EMPTY_IMPOSSIBLE |
| }, |
| [CIT_SETATTR] = { |
| .cio_fini = lov_empty_io_fini, |
| .cio_iter_init = LOV_EMPTY_IMPOSSIBLE, |
| .cio_lock = LOV_EMPTY_IMPOSSIBLE, |
| .cio_start = LOV_EMPTY_IMPOSSIBLE, |
| .cio_end = LOV_EMPTY_IMPOSSIBLE |
| }, |
| [CIT_FAULT] = { |
| .cio_fini = lov_empty_io_fini, |
| .cio_iter_init = LOV_EMPTY_IMPOSSIBLE, |
| .cio_lock = LOV_EMPTY_IMPOSSIBLE, |
| .cio_start = LOV_EMPTY_IMPOSSIBLE, |
| .cio_end = LOV_EMPTY_IMPOSSIBLE |
| }, |
| [CIT_FSYNC] = { |
| .cio_fini = lov_empty_io_fini |
| }, |
| [CIT_MISC] = { |
| .cio_fini = lov_empty_io_fini |
| } |
| }, |
| .cio_submit = LOV_EMPTY_IMPOSSIBLE, |
| .cio_commit_async = LOV_EMPTY_IMPOSSIBLE |
| }; |
| |
| int lov_io_init_raid0(const struct lu_env *env, struct cl_object *obj, |
| struct cl_io *io) |
| { |
| struct lov_io *lio = lov_env_io(env); |
| struct lov_object *lov = cl2lov(obj); |
| |
| INIT_LIST_HEAD(&lio->lis_active); |
| lov_io_slice_init(lio, lov, io); |
| if (io->ci_result == 0) { |
| io->ci_result = lov_io_subio_init(env, lio, io); |
| if (io->ci_result == 0) { |
| cl_io_slice_add(io, &lio->lis_cl, obj, &lov_io_ops); |
| atomic_inc(&lov->lo_active_ios); |
| } |
| } |
| return io->ci_result; |
| } |
| |
| int lov_io_init_empty(const struct lu_env *env, struct cl_object *obj, |
| struct cl_io *io) |
| { |
| struct lov_object *lov = cl2lov(obj); |
| struct lov_io *lio = lov_env_io(env); |
| int result; |
| |
| lio->lis_object = lov; |
| switch (io->ci_type) { |
| default: |
| LBUG(); |
| case CIT_MISC: |
| case CIT_READ: |
| result = 0; |
| break; |
| case CIT_FSYNC: |
| case CIT_SETATTR: |
| result = 1; |
| break; |
| case CIT_WRITE: |
| result = -EBADF; |
| break; |
| case CIT_FAULT: |
| result = -EFAULT; |
| CERROR("Page fault on a file without stripes: "DFID"\n", |
| PFID(lu_object_fid(&obj->co_lu))); |
| break; |
| } |
| if (result == 0) { |
| cl_io_slice_add(io, &lio->lis_cl, obj, &lov_empty_io_ops); |
| atomic_inc(&lov->lo_active_ios); |
| } |
| |
| io->ci_result = result < 0 ? result : 0; |
| return result; |
| } |
| |
| int lov_io_init_released(const struct lu_env *env, struct cl_object *obj, |
| struct cl_io *io) |
| { |
| struct lov_object *lov = cl2lov(obj); |
| struct lov_io *lio = lov_env_io(env); |
| int result; |
| |
| LASSERT(lov->lo_lsm); |
| lio->lis_object = lov; |
| |
| switch (io->ci_type) { |
| default: |
| LASSERTF(0, "invalid type %d\n", io->ci_type); |
| case CIT_MISC: |
| case CIT_FSYNC: |
| result = 1; |
| break; |
| case CIT_SETATTR: |
| /* the truncate to 0 is managed by MDT: |
| * - in open, for open O_TRUNC |
| * - in setattr, for truncate |
| */ |
| /* the truncate is for size > 0 so triggers a restore */ |
| if (cl_io_is_trunc(io)) |
| io->ci_restore_needed = 1; |
| result = -ENODATA; |
| break; |
| case CIT_READ: |
| case CIT_WRITE: |
| case CIT_FAULT: |
| io->ci_restore_needed = 1; |
| result = -ENODATA; |
| break; |
| } |
| if (result == 0) { |
| cl_io_slice_add(io, &lio->lis_cl, obj, &lov_empty_io_ops); |
| atomic_inc(&lov->lo_active_ios); |
| } |
| |
| io->ci_result = result < 0 ? result : 0; |
| return result; |
| } |
| |
| /** @} lov */ |