Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 1 | /* |
| 2 | * GPL HEADER START |
| 3 | * |
| 4 | * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
| 5 | * |
| 6 | * This program is free software; you can redistribute it and/or modify |
| 7 | * it under the terms of the GNU General Public License version 2 only, |
| 8 | * as published by the Free Software Foundation. |
| 9 | * |
| 10 | * This program is distributed in the hope that it will be useful, but |
| 11 | * WITHOUT ANY WARRANTY; without even the implied warranty of |
| 12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 13 | * General Public License version 2 for more details (a copy is included |
| 14 | * in the LICENSE file that accompanied this code). |
| 15 | * |
| 16 | * You should have received a copy of the GNU General Public License |
| 17 | * version 2 along with this program; If not, see |
Oleg Drokin | 6a5b99a | 2016-06-14 23:33:40 -0400 | [diff] [blame] | 18 | * http://www.gnu.org/licenses/gpl-2.0.html |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 19 | * |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 20 | * GPL HEADER END |
| 21 | */ |
| 22 | /* |
| 23 | * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved. |
| 24 | * Use is subject to license terms. |
| 25 | * |
Andreas Dilger | 1dc563a | 2015-11-08 18:09:37 -0500 | [diff] [blame] | 26 | * Copyright (c) 2011, 2015, Intel Corporation. |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 27 | */ |
| 28 | /* |
| 29 | * This file is part of Lustre, http://www.lustre.org/ |
| 30 | * Lustre is a trademark of Sun Microsystems, Inc. |
| 31 | * |
| 32 | * Implementation of cl_page for OSC layer. |
| 33 | * |
| 34 | * Author: Nikita Danilov <nikita.danilov@sun.com> |
Jinshan Xiong | d9d4790 | 2016-03-30 19:48:28 -0400 | [diff] [blame] | 35 | * Author: Jinshan Xiong <jinshan.xiong@intel.com> |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 36 | */ |
| 37 | |
| 38 | #define DEBUG_SUBSYSTEM S_OSC |
| 39 | |
| 40 | #include "osc_cl_internal.h" |
| 41 | |
/* Forward declarations of the LRU helpers that the page operations in this
 * file call before the helpers' definitions appear.
 */
static int osc_lru_reserve(const struct lu_env *env, struct osc_object *obj,
			   struct osc_page *opg);
static void osc_lru_use(struct client_obd *cli, struct osc_page *opg);
static void osc_lru_del(struct client_obd *cli, struct osc_page *opg);
| 46 | |
| 47 | /** \addtogroup osc |
| 48 | * @{ |
| 49 | */ |
| 50 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 51 | /***************************************************************************** |
| 52 | * |
| 53 | * Page operations. |
| 54 | * |
| 55 | */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 56 | static void osc_page_transfer_get(struct osc_page *opg, const char *label) |
| 57 | { |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 58 | struct cl_page *page = opg->ops_cl.cpl_page; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 59 | |
| 60 | LASSERT(!opg->ops_transfer_pinned); |
| 61 | cl_page_get(page); |
| 62 | lu_ref_add_atomic(&page->cp_reference, label, page); |
| 63 | opg->ops_transfer_pinned = 1; |
| 64 | } |
| 65 | |
| 66 | static void osc_page_transfer_put(const struct lu_env *env, |
| 67 | struct osc_page *opg) |
| 68 | { |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 69 | struct cl_page *page = opg->ops_cl.cpl_page; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 70 | |
| 71 | if (opg->ops_transfer_pinned) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 72 | opg->ops_transfer_pinned = 0; |
Jinshan Xiong | 77605e4 | 2016-03-30 19:48:30 -0400 | [diff] [blame] | 73 | lu_ref_del(&page->cp_reference, "transfer", page); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 74 | cl_page_put(env, page); |
| 75 | } |
| 76 | } |
| 77 | |
| 78 | /** |
| 79 | * This is called once for every page when it is submitted for a transfer |
| 80 | * either opportunistic (osc_page_cache_add()), or immediate |
| 81 | * (osc_page_submit()). |
| 82 | */ |
| 83 | static void osc_page_transfer_add(const struct lu_env *env, |
| 84 | struct osc_page *opg, enum cl_req_type crt) |
| 85 | { |
| 86 | struct osc_object *obj = cl2osc(opg->ops_cl.cpl_obj); |
| 87 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 88 | osc_lru_use(osc_cli(obj), opg); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 89 | |
| 90 | spin_lock(&obj->oo_seatbelt); |
| 91 | list_add(&opg->ops_inflight, &obj->oo_inflight[crt]); |
| 92 | opg->ops_submitter = current; |
| 93 | spin_unlock(&obj->oo_seatbelt); |
| 94 | } |
| 95 | |
Jinshan Xiong | 77605e4 | 2016-03-30 19:48:30 -0400 | [diff] [blame] | 96 | int osc_page_cache_add(const struct lu_env *env, |
| 97 | const struct cl_page_slice *slice, struct cl_io *io) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 98 | { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 99 | struct osc_page *opg = cl2osc_page(slice); |
| 100 | int result; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 101 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 102 | osc_page_transfer_get(opg, "transfer\0cache"); |
| 103 | result = osc_queue_async_io(env, io, opg); |
| 104 | if (result != 0) |
| 105 | osc_page_transfer_put(env, opg); |
| 106 | else |
| 107 | osc_page_transfer_add(env, opg, CRT_WRITE); |
| 108 | |
Greg Kroah-Hartman | 0a3bdb0 | 2013-08-03 10:35:28 +0800 | [diff] [blame] | 109 | return result; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 110 | } |
| 111 | |
| 112 | void osc_index2policy(ldlm_policy_data_t *policy, const struct cl_object *obj, |
| 113 | pgoff_t start, pgoff_t end) |
| 114 | { |
Joe Perches | ec83e61 | 2013-10-13 20:22:03 -0700 | [diff] [blame] | 115 | memset(policy, 0, sizeof(*policy)); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 116 | policy->l_extent.start = cl_offset(obj, start); |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 117 | policy->l_extent.end = cl_offset(obj, end + 1) - 1; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 118 | } |
| 119 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 120 | static int osc_page_is_under_lock(const struct lu_env *env, |
| 121 | const struct cl_page_slice *slice, |
Jinshan Xiong | fd7444f | 2016-03-30 19:48:33 -0400 | [diff] [blame] | 122 | struct cl_io *unused, pgoff_t *max_index) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 123 | { |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 124 | struct osc_page *opg = cl2osc_page(slice); |
Jinshan Xiong | 06563b5 | 2016-03-30 19:48:40 -0400 | [diff] [blame] | 125 | struct ldlm_lock *dlmlock; |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 126 | int result = -ENODATA; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 127 | |
Jinshan Xiong | 06563b5 | 2016-03-30 19:48:40 -0400 | [diff] [blame] | 128 | dlmlock = osc_dlmlock_at_pgoff(env, cl2osc(slice->cpl_obj), |
| 129 | osc_index(opg), 1, 0); |
| 130 | if (dlmlock) { |
| 131 | *max_index = cl_index(slice->cpl_obj, |
| 132 | dlmlock->l_policy_data.l_extent.end); |
| 133 | LDLM_LOCK_PUT(dlmlock); |
Jinshan Xiong | fd7444f | 2016-03-30 19:48:33 -0400 | [diff] [blame] | 134 | result = 0; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 135 | } |
Greg Kroah-Hartman | 0a3bdb0 | 2013-08-03 10:35:28 +0800 | [diff] [blame] | 136 | return result; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 137 | } |
| 138 | |
/* Debug helper: "-" for an empty list, "+" for a non-empty one. */
static const char *osc_list(struct list_head *head)
{
	if (list_empty(head))
		return "-";

	return "+";
}
| 143 | |
Greg Kroah-Hartman | a649ad1 | 2014-07-12 00:27:46 -0700 | [diff] [blame] | 144 | static inline unsigned long osc_submit_duration(struct osc_page *opg) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 145 | { |
| 146 | if (opg->ops_submit_time == 0) |
| 147 | return 0; |
| 148 | |
| 149 | return (cfs_time_current() - opg->ops_submit_time); |
| 150 | } |
| 151 | |
| 152 | static int osc_page_print(const struct lu_env *env, |
| 153 | const struct cl_page_slice *slice, |
| 154 | void *cookie, lu_printer_t printer) |
| 155 | { |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 156 | struct osc_page *opg = cl2osc_page(slice); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 157 | struct osc_async_page *oap = &opg->ops_oap; |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 158 | struct osc_object *obj = cl2osc(slice->cpl_obj); |
| 159 | struct client_obd *cli = &osc_export(obj)->exp_obd->u.cli; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 160 | |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 161 | return (*printer)(env, cookie, LUSTRE_OSC_NAME "-page@%p %lu: 1< %#x %d %u %s %s > 2< %llu %u %u %#x %#x | %p %p %p > 3< %s %p %d %lu %d > 4< %d %d %d %lu %s | %s %s %s %s > 5< %s %s %s %s | %d %s | %d %s %s>\n", |
| 162 | opg, osc_index(opg), |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 163 | /* 1 */ |
| 164 | oap->oap_magic, oap->oap_cmd, |
| 165 | oap->oap_interrupted, |
| 166 | osc_list(&oap->oap_pending_item), |
| 167 | osc_list(&oap->oap_rpc_item), |
| 168 | /* 2 */ |
| 169 | oap->oap_obj_off, oap->oap_page_off, oap->oap_count, |
| 170 | oap->oap_async_flags, oap->oap_brw_flags, |
| 171 | oap->oap_request, oap->oap_cli, obj, |
| 172 | /* 3 */ |
| 173 | osc_list(&opg->ops_inflight), |
| 174 | opg->ops_submitter, opg->ops_transfer_pinned, |
| 175 | osc_submit_duration(opg), opg->ops_srvlock, |
| 176 | /* 4 */ |
| 177 | cli->cl_r_in_flight, cli->cl_w_in_flight, |
| 178 | cli->cl_max_rpcs_in_flight, |
| 179 | cli->cl_avail_grant, |
| 180 | osc_list(&cli->cl_cache_waiters), |
| 181 | osc_list(&cli->cl_loi_ready_list), |
| 182 | osc_list(&cli->cl_loi_hp_ready_list), |
| 183 | osc_list(&cli->cl_loi_write_list), |
| 184 | osc_list(&cli->cl_loi_read_list), |
| 185 | /* 5 */ |
| 186 | osc_list(&obj->oo_ready_item), |
| 187 | osc_list(&obj->oo_hp_ready_item), |
| 188 | osc_list(&obj->oo_write_item), |
| 189 | osc_list(&obj->oo_read_item), |
| 190 | atomic_read(&obj->oo_nr_reads), |
| 191 | osc_list(&obj->oo_reading_exts), |
| 192 | atomic_read(&obj->oo_nr_writes), |
| 193 | osc_list(&obj->oo_hp_exts), |
| 194 | osc_list(&obj->oo_urgent_exts)); |
| 195 | } |
| 196 | |
| 197 | static void osc_page_delete(const struct lu_env *env, |
| 198 | const struct cl_page_slice *slice) |
| 199 | { |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 200 | struct osc_page *opg = cl2osc_page(slice); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 201 | struct osc_object *obj = cl2osc(opg->ops_cl.cpl_obj); |
| 202 | int rc; |
| 203 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 204 | CDEBUG(D_TRACE, "%p\n", opg); |
| 205 | osc_page_transfer_put(env, opg); |
| 206 | rc = osc_teardown_async_page(env, obj, opg); |
| 207 | if (rc) { |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 208 | CL_PAGE_DEBUG(D_ERROR, env, slice->cpl_page, |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 209 | "Trying to teardown failed: %d\n", rc); |
| 210 | LASSERT(0); |
| 211 | } |
| 212 | |
| 213 | spin_lock(&obj->oo_seatbelt); |
Oleg Drokin | 7f1ae4c | 2016-02-16 00:46:57 -0500 | [diff] [blame] | 214 | if (opg->ops_submitter) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 215 | LASSERT(!list_empty(&opg->ops_inflight)); |
| 216 | list_del_init(&opg->ops_inflight); |
| 217 | opg->ops_submitter = NULL; |
| 218 | } |
| 219 | spin_unlock(&obj->oo_seatbelt); |
| 220 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 221 | osc_lru_del(osc_cli(obj), opg); |
Jinshan Xiong | d9d4790 | 2016-03-30 19:48:28 -0400 | [diff] [blame] | 222 | |
| 223 | if (slice->cpl_page->cp_type == CPT_CACHEABLE) { |
| 224 | void *value; |
| 225 | |
| 226 | spin_lock(&obj->oo_tree_lock); |
| 227 | value = radix_tree_delete(&obj->oo_tree, osc_index(opg)); |
| 228 | if (value) |
| 229 | --obj->oo_npages; |
| 230 | spin_unlock(&obj->oo_tree_lock); |
| 231 | |
| 232 | LASSERT(ergo(value, value == opg)); |
| 233 | } |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 234 | } |
| 235 | |
CHANG FU CHIAO | f6ab21b | 2016-02-06 13:57:48 +0800 | [diff] [blame] | 236 | static void osc_page_clip(const struct lu_env *env, |
| 237 | const struct cl_page_slice *slice, int from, int to) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 238 | { |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 239 | struct osc_page *opg = cl2osc_page(slice); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 240 | struct osc_async_page *oap = &opg->ops_oap; |
| 241 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 242 | opg->ops_from = from; |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 243 | opg->ops_to = to; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 244 | spin_lock(&oap->oap_lock); |
| 245 | oap->oap_async_flags |= ASYNC_COUNT_STABLE; |
| 246 | spin_unlock(&oap->oap_lock); |
| 247 | } |
| 248 | |
| 249 | static int osc_page_cancel(const struct lu_env *env, |
| 250 | const struct cl_page_slice *slice) |
| 251 | { |
| 252 | struct osc_page *opg = cl2osc_page(slice); |
| 253 | int rc = 0; |
| 254 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 255 | /* Check if the transferring against this page |
Oleg Drokin | 30aa9c5 | 2016-02-24 22:00:37 -0500 | [diff] [blame] | 256 | * is completed, or not even queued. |
| 257 | */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 258 | if (opg->ops_transfer_pinned) |
| 259 | /* FIXME: may not be interrupted.. */ |
| 260 | rc = osc_cancel_async_page(env, opg); |
| 261 | LASSERT(ergo(rc == 0, opg->ops_transfer_pinned == 0)); |
| 262 | return rc; |
| 263 | } |
| 264 | |
/**
 * cl_page_operations::cpo_flush() for the OSC layer: forwards to
 * osc_flush_async_page() and returns its result.
 */
static int osc_page_flush(const struct lu_env *env,
			  const struct cl_page_slice *slice,
			  struct cl_io *io)
{
	return osc_flush_async_page(env, io, cl2osc_page(slice));
}
| 275 | |
| 276 | static const struct cl_page_operations osc_page_ops = { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 277 | .cpo_print = osc_page_print, |
| 278 | .cpo_delete = osc_page_delete, |
| 279 | .cpo_is_under_lock = osc_page_is_under_lock, |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 280 | .cpo_clip = osc_page_clip, |
| 281 | .cpo_cancel = osc_page_cancel, |
| 282 | .cpo_flush = osc_page_flush |
| 283 | }; |
| 284 | |
| 285 | int osc_page_init(const struct lu_env *env, struct cl_object *obj, |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 286 | struct cl_page *page, pgoff_t index) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 287 | { |
| 288 | struct osc_object *osc = cl2osc(obj); |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 289 | struct osc_page *opg = cl_object_page_slice(obj, page); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 290 | int result; |
| 291 | |
| 292 | opg->ops_from = 0; |
Kirill A. Shutemov | 09cbfea | 2016-04-01 15:29:47 +0300 | [diff] [blame] | 293 | opg->ops_to = PAGE_SIZE; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 294 | |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 295 | result = osc_prep_async_page(osc, opg, page->cp_vmpage, |
| 296 | cl_offset(obj, index)); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 297 | if (result == 0) { |
| 298 | struct osc_io *oio = osc_env_io(env); |
Mike Rapoport | 50ffcb7 | 2015-10-13 16:03:40 +0300 | [diff] [blame] | 299 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 300 | opg->ops_srvlock = osc_io_srvlock(oio); |
Jinshan Xiong | fd7444f | 2016-03-30 19:48:33 -0400 | [diff] [blame] | 301 | cl_page_slice_add(page, &opg->ops_cl, obj, index, |
| 302 | &osc_page_ops); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 303 | } |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 304 | /* ops_inflight and ops_lru are the same field, but it doesn't |
Oleg Drokin | 30aa9c5 | 2016-02-24 22:00:37 -0500 | [diff] [blame] | 305 | * hurt to initialize it twice :-) |
| 306 | */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 307 | INIT_LIST_HEAD(&opg->ops_inflight); |
| 308 | INIT_LIST_HEAD(&opg->ops_lru); |
| 309 | |
| 310 | /* reserve an LRU space for this page */ |
Jinshan Xiong | d9d4790 | 2016-03-30 19:48:28 -0400 | [diff] [blame] | 311 | if (page->cp_type == CPT_CACHEABLE && result == 0) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 312 | result = osc_lru_reserve(env, osc, opg); |
Jinshan Xiong | d9d4790 | 2016-03-30 19:48:28 -0400 | [diff] [blame] | 313 | if (result == 0) { |
| 314 | spin_lock(&osc->oo_tree_lock); |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 315 | result = radix_tree_insert(&osc->oo_tree, index, opg); |
Jinshan Xiong | d9d4790 | 2016-03-30 19:48:28 -0400 | [diff] [blame] | 316 | if (result == 0) |
| 317 | ++osc->oo_npages; |
| 318 | spin_unlock(&osc->oo_tree_lock); |
| 319 | LASSERT(result == 0); |
| 320 | } |
| 321 | } |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 322 | |
| 323 | return result; |
| 324 | } |
| 325 | |
Prakash Surya | ad47928 | 2016-04-27 18:21:06 -0400 | [diff] [blame] | 326 | int osc_over_unstable_soft_limit(struct client_obd *cli) |
| 327 | { |
| 328 | long obd_upages, obd_dpages, osc_upages; |
| 329 | |
| 330 | /* Can't check cli->cl_unstable_count, therefore, no soft limit */ |
| 331 | if (!cli) |
| 332 | return 0; |
| 333 | |
| 334 | obd_upages = atomic_read(&obd_unstable_pages); |
| 335 | obd_dpages = atomic_read(&obd_dirty_pages); |
| 336 | |
| 337 | osc_upages = atomic_read(&cli->cl_unstable_count); |
| 338 | |
| 339 | /* |
| 340 | * obd_max_dirty_pages is the max number of (dirty + unstable) |
| 341 | * pages allowed at any given time. To simulate an unstable page |
| 342 | * only limit, we subtract the current number of dirty pages |
| 343 | * from this max. This difference is roughly the amount of pages |
| 344 | * currently available for unstable pages. Thus, the soft limit |
| 345 | * is half of that difference. Check osc_upages to ensure we don't |
| 346 | * set SOFT_SYNC for OSCs without any outstanding unstable pages. |
| 347 | */ |
| 348 | return osc_upages && |
| 349 | obd_upages >= (obd_max_dirty_pages - obd_dpages) / 2; |
| 350 | } |
| 351 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 352 | /** |
| 353 | * Helper function called by osc_io_submit() for every page in an immediate |
| 354 | * transfer (i.e., transferred synchronously). |
| 355 | */ |
| 356 | void osc_page_submit(const struct lu_env *env, struct osc_page *opg, |
| 357 | enum cl_req_type crt, int brw_flags) |
| 358 | { |
| 359 | struct osc_async_page *oap = &opg->ops_oap; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 360 | |
Joe Perches | 2d00bd1 | 2014-11-23 11:28:50 -0800 | [diff] [blame] | 361 | LASSERTF(oap->oap_magic == OAP_MAGIC, "Bad oap magic: oap %p, magic 0x%x\n", |
| 362 | oap, oap->oap_magic); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 363 | LASSERT(oap->oap_async_flags & ASYNC_READY); |
| 364 | LASSERT(oap->oap_async_flags & ASYNC_COUNT_STABLE); |
| 365 | |
Chris Hanna | 29ac684 | 2015-06-03 10:23:42 -0400 | [diff] [blame] | 366 | oap->oap_cmd = crt == CRT_WRITE ? OBD_BRW_WRITE : OBD_BRW_READ; |
| 367 | oap->oap_page_off = opg->ops_from; |
| 368 | oap->oap_count = opg->ops_to - opg->ops_from; |
Julia Lawall | 40daf5c | 2015-08-29 19:30:11 +0200 | [diff] [blame] | 369 | oap->oap_brw_flags = brw_flags | OBD_BRW_SYNC; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 370 | |
Prakash Surya | ad47928 | 2016-04-27 18:21:06 -0400 | [diff] [blame] | 371 | if (osc_over_unstable_soft_limit(oap->oap_cli)) |
| 372 | oap->oap_brw_flags |= OBD_BRW_SOFT_SYNC; |
| 373 | |
Fan Yong | 341f1f0 | 2016-06-19 22:53:53 -0400 | [diff] [blame] | 374 | if (capable(CFS_CAP_SYS_RESOURCE)) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 375 | oap->oap_brw_flags |= OBD_BRW_NOQUOTA; |
| 376 | oap->oap_cmd |= OBD_BRW_NOQUOTA; |
| 377 | } |
| 378 | |
| 379 | opg->ops_submit_time = cfs_time_current(); |
| 380 | osc_page_transfer_get(opg, "transfer\0imm"); |
| 381 | osc_page_transfer_add(env, opg, crt); |
| 382 | } |
| 383 | |
| 384 | /* --------------- LRU page management ------------------ */ |
| 385 | |
/* OSC is a natural place to manage LRU pages, as applications are specialized
 * to write OSC by OSC. Ideally, an OSC that is used more frequently should
 * occupy more LRU slots. On the other hand, we should avoid using up all LRU
 * slots (client_obd::cl_lru_left); otherwise a process has to be put to sleep
 * waiting for free LRU slots, which is very bad. The algorithm therefore
 * requires each OSC to free slots voluntarily, so that a reasonable number of
 * free slots is maintained at any time.
 */
| 394 | |
/* Wait queue woken by osc_lru_del() each time an LRU slot is released. */
static DECLARE_WAIT_QUEUE_HEAD(osc_lru_waitq);
/* LRU pages are freed in batch mode. OSC should at least free this
 * number of pages to avoid running out of LRU budget, and..
 */
static const int lru_shrink_min = 2 << (20 - PAGE_SHIFT);  /* 2M */
/* ..free at most this number, otherwise it would take too long to finish. */
static const int lru_shrink_max = 8 << (20 - PAGE_SHIFT); /* 8M */
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 402 | |
| 403 | /* Check if we can free LRU slots from this OSC. If there exists LRU waiters, |
| 404 | * we should free slots aggressively. In this way, slots are freed in a steady |
| 405 | * step to maintain fairness among OSCs. |
| 406 | * |
Oleg Drokin | 30aa9c5 | 2016-02-24 22:00:37 -0500 | [diff] [blame] | 407 | * Return how many LRU pages should be freed. |
| 408 | */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 409 | static int osc_cache_too_much(struct client_obd *cli) |
| 410 | { |
| 411 | struct cl_client_cache *cache = cli->cl_cache; |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 412 | int pages = atomic_read(&cli->cl_lru_in_list); |
| 413 | unsigned long budget; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 414 | |
Emoly Liu | 1b02bde | 2016-06-20 16:55:24 -0400 | [diff] [blame] | 415 | budget = cache->ccc_lru_max / (atomic_read(&cache->ccc_users) - 2); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 416 | |
| 417 | /* if it's going to run out LRU slots, we should free some, but not |
Oleg Drokin | 30aa9c5 | 2016-02-24 22:00:37 -0500 | [diff] [blame] | 418 | * too much to maintain fairness among OSCs. |
| 419 | */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 420 | if (atomic_read(cli->cl_lru_left) < cache->ccc_lru_max >> 4) { |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 421 | if (pages >= budget) |
| 422 | return lru_shrink_max; |
| 423 | else if (pages >= budget / 2) |
| 424 | return lru_shrink_min; |
Oleg Drokin | da5ecb4 | 2016-04-01 15:18:01 -0400 | [diff] [blame] | 425 | } else if (pages >= budget * 2) { |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 426 | return lru_shrink_min; |
Oleg Drokin | da5ecb4 | 2016-04-01 15:18:01 -0400 | [diff] [blame] | 427 | } |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 428 | return 0; |
| 429 | } |
| 430 | |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 431 | int lru_queue_work(const struct lu_env *env, void *data) |
| 432 | { |
| 433 | struct client_obd *cli = data; |
| 434 | |
| 435 | CDEBUG(D_CACHE, "Run LRU work for client obd %p.\n", cli); |
| 436 | |
| 437 | if (osc_cache_too_much(cli)) |
| 438 | osc_lru_shrink(env, cli, lru_shrink_max, true); |
| 439 | |
| 440 | return 0; |
| 441 | } |
| 442 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 443 | void osc_lru_add_batch(struct client_obd *cli, struct list_head *plist) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 444 | { |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 445 | LIST_HEAD(lru); |
| 446 | struct osc_async_page *oap; |
| 447 | int npages = 0; |
| 448 | |
| 449 | list_for_each_entry(oap, plist, oap_pending_item) { |
| 450 | struct osc_page *opg = oap2osc_page(oap); |
| 451 | |
| 452 | if (!opg->ops_in_lru) |
| 453 | continue; |
| 454 | |
| 455 | ++npages; |
| 456 | LASSERT(list_empty(&opg->ops_lru)); |
| 457 | list_add(&opg->ops_lru, &lru); |
| 458 | } |
| 459 | |
| 460 | if (npages > 0) { |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 461 | spin_lock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 462 | list_splice_tail(&lru, &cli->cl_lru_list); |
| 463 | atomic_sub(npages, &cli->cl_lru_busy); |
| 464 | atomic_add(npages, &cli->cl_lru_in_list); |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 465 | spin_unlock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 466 | |
| 467 | /* XXX: May set force to be true for better performance */ |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 468 | if (osc_cache_too_much(cli)) |
| 469 | (void)ptlrpcd_queue_work(cli->cl_lru_work); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 470 | } |
| 471 | } |
| 472 | |
/* Unlink @opg from the LRU list and decrement cl_lru_in_list, which must be
 * positive on entry. The callers in this file hold cl_lru_list_lock around
 * this call.
 */
static void __osc_lru_del(struct client_obd *cli, struct osc_page *opg)
{
	LASSERT(atomic_read(&cli->cl_lru_in_list) > 0);
	list_del_init(&opg->ops_lru);
	atomic_dec(&cli->cl_lru_in_list);
}
| 479 | |
| 480 | /** |
| 481 | * Page is being destroyed. The page may be not in LRU list, if the transfer |
| 482 | * has never finished(error occurred). |
| 483 | */ |
| 484 | static void osc_lru_del(struct client_obd *cli, struct osc_page *opg) |
| 485 | { |
| 486 | if (opg->ops_in_lru) { |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 487 | spin_lock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 488 | if (!list_empty(&opg->ops_lru)) { |
| 489 | __osc_lru_del(cli, opg); |
| 490 | } else { |
| 491 | LASSERT(atomic_read(&cli->cl_lru_busy) > 0); |
| 492 | atomic_dec(&cli->cl_lru_busy); |
| 493 | } |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 494 | spin_unlock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 495 | |
| 496 | atomic_inc(cli->cl_lru_left); |
| 497 | /* this is a great place to release more LRU pages if |
| 498 | * this osc occupies too many LRU pages and kernel is |
| 499 | * stealing one of them. |
| 500 | */ |
| 501 | if (!memory_pressure_get()) |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 502 | (void)ptlrpcd_queue_work(cli->cl_lru_work); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 503 | wake_up(&osc_lru_waitq); |
| 504 | } else { |
| 505 | LASSERT(list_empty(&opg->ops_lru)); |
| 506 | } |
| 507 | } |
| 508 | |
| 509 | /** |
| 510 | * Delete page from LRUlist for redirty. |
| 511 | */ |
| 512 | static void osc_lru_use(struct client_obd *cli, struct osc_page *opg) |
| 513 | { |
| 514 | /* If page is being transferred for the first time, |
| 515 | * ops_lru should be empty |
| 516 | */ |
| 517 | if (opg->ops_in_lru && !list_empty(&opg->ops_lru)) { |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 518 | spin_lock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 519 | __osc_lru_del(cli, opg); |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 520 | spin_unlock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 521 | atomic_inc(&cli->cl_lru_busy); |
| 522 | } |
| 523 | } |
| 524 | |
| 525 | static void discard_pagevec(const struct lu_env *env, struct cl_io *io, |
| 526 | struct cl_page **pvec, int max_index) |
| 527 | { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 528 | int i; |
| 529 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 530 | for (i = 0; i < max_index; i++) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 531 | struct cl_page *page = pvec[i]; |
Mike Rapoport | 50ffcb7 | 2015-10-13 16:03:40 +0300 | [diff] [blame] | 532 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 533 | LASSERT(cl_page_is_owned(page, io)); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 534 | cl_page_discard(env, io, page); |
| 535 | cl_page_disown(env, io, page); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 536 | cl_page_put(env, page); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 537 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 538 | pvec[i] = NULL; |
| 539 | } |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 540 | } |
| 541 | |
| 542 | /** |
| 543 | * Drop @target of pages from LRU at most. |
| 544 | */ |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 545 | int osc_lru_shrink(const struct lu_env *env, struct client_obd *cli, |
| 546 | int target, bool force) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 547 | { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 548 | struct cl_io *io; |
| 549 | struct cl_object *clobj = NULL; |
| 550 | struct cl_page **pvec; |
| 551 | struct osc_page *opg; |
Bhaktipriya Shridhar | 8adddc3 | 2016-03-12 01:36:51 +0530 | [diff] [blame] | 552 | struct osc_page *temp; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 553 | int maxscan = 0; |
| 554 | int count = 0; |
| 555 | int index = 0; |
| 556 | int rc = 0; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 557 | |
| 558 | LASSERT(atomic_read(&cli->cl_lru_in_list) >= 0); |
| 559 | if (atomic_read(&cli->cl_lru_in_list) == 0 || target <= 0) |
Greg Kroah-Hartman | 0a3bdb0 | 2013-08-03 10:35:28 +0800 | [diff] [blame] | 560 | return 0; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 561 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 562 | if (!force) { |
| 563 | if (atomic_read(&cli->cl_lru_shrinkers) > 0) |
| 564 | return -EBUSY; |
| 565 | |
| 566 | if (atomic_inc_return(&cli->cl_lru_shrinkers) > 1) { |
| 567 | atomic_dec(&cli->cl_lru_shrinkers); |
| 568 | return -EBUSY; |
| 569 | } |
| 570 | } else { |
| 571 | atomic_inc(&cli->cl_lru_shrinkers); |
| 572 | } |
| 573 | |
Jinshan Xiong | d9d4790 | 2016-03-30 19:48:28 -0400 | [diff] [blame] | 574 | pvec = (struct cl_page **)osc_env_info(env)->oti_pvec; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 575 | io = &osc_env_info(env)->oti_io; |
| 576 | |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 577 | spin_lock(&cli->cl_lru_list_lock); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 578 | maxscan = min(target << 1, atomic_read(&cli->cl_lru_in_list)); |
Bhaktipriya Shridhar | 8adddc3 | 2016-03-12 01:36:51 +0530 | [diff] [blame] | 579 | list_for_each_entry_safe(opg, temp, &cli->cl_lru_list, ops_lru) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 580 | struct cl_page *page; |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 581 | bool will_free = false; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 582 | |
| 583 | if (--maxscan < 0) |
| 584 | break; |
| 585 | |
Jinshan Xiong | 7addf40 | 2016-03-30 19:48:32 -0400 | [diff] [blame] | 586 | page = opg->ops_cl.cpl_page; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 587 | if (cl_page_in_use_noref(page)) { |
| 588 | list_move_tail(&opg->ops_lru, &cli->cl_lru_list); |
| 589 | continue; |
| 590 | } |
| 591 | |
Oleg Drokin | 7f1ae4c | 2016-02-16 00:46:57 -0500 | [diff] [blame] | 592 | LASSERT(page->cp_obj); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 593 | if (clobj != page->cp_obj) { |
| 594 | struct cl_object *tmp = page->cp_obj; |
| 595 | |
| 596 | cl_object_get(tmp); |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 597 | spin_unlock(&cli->cl_lru_list_lock); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 598 | |
Oleg Drokin | 7f1ae4c | 2016-02-16 00:46:57 -0500 | [diff] [blame] | 599 | if (clobj) { |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 600 | discard_pagevec(env, io, pvec, index); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 601 | index = 0; |
| 602 | |
| 603 | cl_io_fini(env, io); |
| 604 | cl_object_put(env, clobj); |
| 605 | clobj = NULL; |
| 606 | } |
| 607 | |
| 608 | clobj = tmp; |
| 609 | io->ci_obj = clobj; |
| 610 | io->ci_ignore_layout = 1; |
| 611 | rc = cl_io_init(env, io, CIT_MISC, clobj); |
| 612 | |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 613 | spin_lock(&cli->cl_lru_list_lock); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 614 | |
| 615 | if (rc != 0) |
| 616 | break; |
| 617 | |
| 618 | ++maxscan; |
| 619 | continue; |
| 620 | } |
| 621 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 622 | if (cl_page_own_try(env, io, page) == 0) { |
| 623 | if (!cl_page_in_use_noref(page)) { |
| 624 | /* remove it from lru list earlier to avoid |
| 625 | * lock contention |
| 626 | */ |
| 627 | __osc_lru_del(cli, opg); |
| 628 | opg->ops_in_lru = 0; /* will be discarded */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 629 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 630 | cl_page_get(page); |
| 631 | will_free = true; |
| 632 | } else { |
| 633 | cl_page_disown(env, io, page); |
| 634 | } |
| 635 | } |
| 636 | |
| 637 | if (!will_free) { |
| 638 | list_move_tail(&opg->ops_lru, &cli->cl_lru_list); |
| 639 | continue; |
| 640 | } |
| 641 | |
| 642 | /* Don't discard and free the page with cl_lru_list held */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 643 | pvec[index++] = page; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 644 | if (unlikely(index == OTI_PVEC_SIZE)) { |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 645 | spin_unlock(&cli->cl_lru_list_lock); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 646 | discard_pagevec(env, io, pvec, index); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 647 | index = 0; |
| 648 | |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 649 | spin_lock(&cli->cl_lru_list_lock); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 650 | } |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 651 | |
| 652 | if (++count >= target) |
| 653 | break; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 654 | } |
John L. Hammond | 7d53d8f | 2016-03-30 19:48:36 -0400 | [diff] [blame] | 655 | spin_unlock(&cli->cl_lru_list_lock); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 656 | |
Oleg Drokin | 7f1ae4c | 2016-02-16 00:46:57 -0500 | [diff] [blame] | 657 | if (clobj) { |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 658 | discard_pagevec(env, io, pvec, index); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 659 | |
| 660 | cl_io_fini(env, io); |
| 661 | cl_object_put(env, clobj); |
| 662 | } |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 663 | |
| 664 | atomic_dec(&cli->cl_lru_shrinkers); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 665 | if (count > 0) { |
| 666 | atomic_add(count, cli->cl_lru_left); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 667 | wake_up_all(&osc_lru_waitq); |
| 668 | } |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 669 | return count > 0 ? count : rc; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 670 | } |
| 671 | |
| 672 | static inline int max_to_shrink(struct client_obd *cli) |
| 673 | { |
| 674 | return min(atomic_read(&cli->cl_lru_in_list) >> 1, lru_shrink_max); |
| 675 | } |
| 676 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 677 | int osc_lru_reclaim(struct client_obd *cli) |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 678 | { |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 679 | struct cl_env_nest nest; |
| 680 | struct lu_env *env; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 681 | struct cl_client_cache *cache = cli->cl_cache; |
| 682 | int max_scans; |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 683 | int rc = 0; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 684 | |
Oleg Drokin | 7f1ae4c | 2016-02-16 00:46:57 -0500 | [diff] [blame] | 685 | LASSERT(cache); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 686 | |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 687 | env = cl_env_nested_get(&nest); |
| 688 | if (IS_ERR(env)) |
| 689 | return 0; |
| 690 | |
| 691 | rc = osc_lru_shrink(env, cli, osc_cache_too_much(cli), false); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 692 | if (rc != 0) { |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 693 | if (rc == -EBUSY) |
| 694 | rc = 0; |
| 695 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 696 | CDEBUG(D_CACHE, "%s: Free %d pages from own LRU: %p.\n", |
Oleg Drokin | 79910d7 | 2016-02-26 01:50:03 -0500 | [diff] [blame] | 697 | cli->cl_import->imp_obd->obd_name, rc, cli); |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 698 | goto out; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 699 | } |
| 700 | |
| 701 | CDEBUG(D_CACHE, "%s: cli %p no free slots, pages: %d, busy: %d.\n", |
Oleg Drokin | 79910d7 | 2016-02-26 01:50:03 -0500 | [diff] [blame] | 702 | cli->cl_import->imp_obd->obd_name, cli, |
| 703 | atomic_read(&cli->cl_lru_in_list), |
| 704 | atomic_read(&cli->cl_lru_busy)); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 705 | |
| 706 | /* Reclaim LRU slots from other client_obd as it can't free enough |
Oleg Drokin | 30aa9c5 | 2016-02-24 22:00:37 -0500 | [diff] [blame] | 707 | * from its own. This should rarely happen. |
| 708 | */ |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 709 | spin_lock(&cache->ccc_lru_lock); |
Hiroya Nozaki | 0df83c1 | 2015-09-14 18:41:25 -0400 | [diff] [blame] | 710 | LASSERT(!list_empty(&cache->ccc_lru)); |
| 711 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 712 | cache->ccc_lru_shrinkers++; |
| 713 | list_move_tail(&cli->cl_lru_osc, &cache->ccc_lru); |
| 714 | |
Emoly Liu | 1b02bde | 2016-06-20 16:55:24 -0400 | [diff] [blame] | 715 | max_scans = atomic_read(&cache->ccc_users) - 2; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 716 | while (--max_scans > 0 && !list_empty(&cache->ccc_lru)) { |
| 717 | cli = list_entry(cache->ccc_lru.next, struct client_obd, |
Oleg Drokin | 79910d7 | 2016-02-26 01:50:03 -0500 | [diff] [blame] | 718 | cl_lru_osc); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 719 | |
| 720 | CDEBUG(D_CACHE, "%s: cli %p LRU pages: %d, busy: %d.\n", |
Oleg Drokin | 79910d7 | 2016-02-26 01:50:03 -0500 | [diff] [blame] | 721 | cli->cl_import->imp_obd->obd_name, cli, |
| 722 | atomic_read(&cli->cl_lru_in_list), |
| 723 | atomic_read(&cli->cl_lru_busy)); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 724 | |
| 725 | list_move_tail(&cli->cl_lru_osc, &cache->ccc_lru); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 726 | if (osc_cache_too_much(cli) > 0) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 727 | spin_unlock(&cache->ccc_lru_lock); |
| 728 | |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 729 | rc = osc_lru_shrink(env, cli, osc_cache_too_much(cli), |
| 730 | true); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 731 | spin_lock(&cache->ccc_lru_lock); |
| 732 | if (rc != 0) |
| 733 | break; |
| 734 | } |
| 735 | } |
| 736 | spin_unlock(&cache->ccc_lru_lock); |
| 737 | |
Jinshan Xiong | 2579d8d | 2016-03-30 19:48:27 -0400 | [diff] [blame] | 738 | out: |
| 739 | cl_env_nested_put(&nest, env); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 740 | CDEBUG(D_CACHE, "%s: cli %p freed %d pages.\n", |
Oleg Drokin | 79910d7 | 2016-02-26 01:50:03 -0500 | [diff] [blame] | 741 | cli->cl_import->imp_obd->obd_name, cli, rc); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 742 | return rc; |
| 743 | } |
| 744 | |
| 745 | static int osc_lru_reserve(const struct lu_env *env, struct osc_object *obj, |
| 746 | struct osc_page *opg) |
| 747 | { |
| 748 | struct l_wait_info lwi = LWI_INTR(LWI_ON_SIGNAL_NOOP, NULL); |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 749 | struct osc_io *oio = osc_env_io(env); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 750 | struct client_obd *cli = osc_cli(obj); |
| 751 | int rc = 0; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 752 | |
Oleg Drokin | 7f1ae4c | 2016-02-16 00:46:57 -0500 | [diff] [blame] | 753 | if (!cli->cl_cache) /* shall not be in LRU */ |
Greg Kroah-Hartman | 0a3bdb0 | 2013-08-03 10:35:28 +0800 | [diff] [blame] | 754 | return 0; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 755 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 756 | if (oio->oi_lru_reserved > 0) { |
| 757 | --oio->oi_lru_reserved; |
| 758 | goto out; |
| 759 | } |
| 760 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 761 | LASSERT(atomic_read(cli->cl_lru_left) >= 0); |
Greg Kroah-Hartman | 305ec768 | 2013-08-04 08:03:39 +0800 | [diff] [blame] | 762 | while (!atomic_add_unless(cli->cl_lru_left, -1, 0)) { |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 763 | /* run out of LRU spaces, try to drop some by itself */ |
| 764 | rc = osc_lru_reclaim(cli); |
| 765 | if (rc < 0) |
| 766 | break; |
| 767 | if (rc > 0) |
| 768 | continue; |
| 769 | |
| 770 | cond_resched(); |
| 771 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 772 | rc = l_wait_event(osc_lru_waitq, |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 773 | atomic_read(cli->cl_lru_left) > 0, |
Oleg Drokin | 79910d7 | 2016-02-26 01:50:03 -0500 | [diff] [blame] | 774 | &lwi); |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 775 | |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 776 | if (rc < 0) |
| 777 | break; |
| 778 | } |
| 779 | |
Jinshan Xiong | 5196e42 | 2016-03-30 19:48:26 -0400 | [diff] [blame] | 780 | out: |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 781 | if (rc >= 0) { |
| 782 | atomic_inc(&cli->cl_lru_busy); |
| 783 | opg->ops_in_lru = 1; |
| 784 | rc = 0; |
| 785 | } |
| 786 | |
Greg Kroah-Hartman | 0a3bdb0 | 2013-08-03 10:35:28 +0800 | [diff] [blame] | 787 | return rc; |
Peng Tao | d7e09d0 | 2013-05-02 16:46:55 +0800 | [diff] [blame] | 788 | } |
| 789 | |
| 790 | /** @} osc */ |