blob: 153e990c494e6f66bbb10541b17382f547e1eb5d [file] [log] [blame]
Peng Taod7e09d02013-05-02 16:46:55 +08001/*
2 * GPL HEADER START
3 *
4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
9 *
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
15 *
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
Oleg Drokin6a5b99a2016-06-14 23:33:40 -040018 * http://www.gnu.org/licenses/gpl-2.0.html
Peng Taod7e09d02013-05-02 16:46:55 +080019 *
Peng Taod7e09d02013-05-02 16:46:55 +080020 * GPL HEADER END
21 */
22/*
23 * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
25 *
Andreas Dilger1dc563a2015-11-08 18:09:37 -050026 * Copyright (c) 2010, 2015, Intel Corporation.
Peng Taod7e09d02013-05-02 16:46:55 +080027 */
28/*
29 * This file is part of Lustre, http://www.lustre.org/
30 * Lustre is a trademark of Sun Microsystems, Inc.
31 */
32
33/**
34 * This file deals with various client/target related logic including recovery.
35 *
36 * TODO: This code more logically belongs in the ptlrpc module than in ldlm and
37 * should be moved.
38 */
39
40#define DEBUG_SUBSYSTEM S_LDLM
41
Greg Kroah-Hartman9fdaf8c2014-07-11 20:51:16 -070042#include "../../include/linux/libcfs/libcfs.h"
Greg Kroah-Hartmane27db142014-07-11 22:29:36 -070043#include "../include/obd.h"
44#include "../include/obd_class.h"
45#include "../include/lustre_dlm.h"
46#include "../include/lustre_net.h"
47#include "../include/lustre_sec.h"
Peng Taod7e09d02013-05-02 16:46:55 +080048#include "ldlm_internal.h"
49
50/* @priority: If non-zero, move the selected connection to the list head.
51 * @create: If zero, only search in existing connections.
52 */
53static int import_set_conn(struct obd_import *imp, struct obd_uuid *uuid,
54 int priority, int create)
55{
56 struct ptlrpc_connection *ptlrpc_conn;
57 struct obd_import_conn *imp_conn = NULL, *item;
58 int rc = 0;
Peng Taod7e09d02013-05-02 16:46:55 +080059
60 if (!create && !priority) {
61 CDEBUG(D_HA, "Nothing to do\n");
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +080062 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +080063 }
64
65 ptlrpc_conn = ptlrpc_uuid_to_connection(uuid);
66 if (!ptlrpc_conn) {
67 CDEBUG(D_HA, "can't find connection %s\n", uuid->uuid);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +080068 return -ENOENT;
Peng Taod7e09d02013-05-02 16:46:55 +080069 }
70
71 if (create) {
Julia Lawall352f7892015-05-01 17:51:19 +020072 imp_conn = kzalloc(sizeof(*imp_conn), GFP_NOFS);
Julia Lawalld1c0d442014-09-01 22:21:09 +020073 if (!imp_conn) {
74 rc = -ENOMEM;
75 goto out_put;
76 }
Peng Taod7e09d02013-05-02 16:46:55 +080077 }
78
79 spin_lock(&imp->imp_lock);
80 list_for_each_entry(item, &imp->imp_conn_list, oic_item) {
81 if (obd_uuid_equals(uuid, &item->oic_uuid)) {
82 if (priority) {
83 list_del(&item->oic_item);
84 list_add(&item->oic_item,
Oleg Drokin24c198e2016-08-21 18:04:35 -040085 &imp->imp_conn_list);
Peng Taod7e09d02013-05-02 16:46:55 +080086 item->oic_last_attempt = 0;
87 }
88 CDEBUG(D_HA, "imp %p@%s: found existing conn %s%s\n",
89 imp, imp->imp_obd->obd_name, uuid->uuid,
90 (priority ? ", moved to head" : ""));
91 spin_unlock(&imp->imp_lock);
Julia Lawalld1c0d442014-09-01 22:21:09 +020092 rc = 0;
93 goto out_free;
Peng Taod7e09d02013-05-02 16:46:55 +080094 }
95 }
96 /* No existing import connection found for \a uuid. */
97 if (create) {
98 imp_conn->oic_conn = ptlrpc_conn;
99 imp_conn->oic_uuid = *uuid;
100 imp_conn->oic_last_attempt = 0;
101 if (priority)
102 list_add(&imp_conn->oic_item, &imp->imp_conn_list);
103 else
104 list_add_tail(&imp_conn->oic_item,
Oleg Drokin24c198e2016-08-21 18:04:35 -0400105 &imp->imp_conn_list);
Peng Taod7e09d02013-05-02 16:46:55 +0800106 CDEBUG(D_HA, "imp %p@%s: add connection %s at %s\n",
107 imp, imp->imp_obd->obd_name, uuid->uuid,
108 (priority ? "head" : "tail"));
109 } else {
110 spin_unlock(&imp->imp_lock);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200111 rc = -ENOENT;
112 goto out_free;
Peng Taod7e09d02013-05-02 16:46:55 +0800113 }
114
115 spin_unlock(&imp->imp_lock);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800116 return 0;
Peng Taod7e09d02013-05-02 16:46:55 +0800117out_free:
Julia Lawall11345072015-05-01 21:38:06 +0200118 kfree(imp_conn);
Peng Taod7e09d02013-05-02 16:46:55 +0800119out_put:
120 ptlrpc_connection_put(ptlrpc_conn);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800121 return rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800122}
123
124int import_set_conn_priority(struct obd_import *imp, struct obd_uuid *uuid)
125{
126 return import_set_conn(imp, uuid, 1, 0);
127}
128
129int client_import_add_conn(struct obd_import *imp, struct obd_uuid *uuid,
130 int priority)
131{
132 return import_set_conn(imp, uuid, priority, 1);
133}
134EXPORT_SYMBOL(client_import_add_conn);
135
136int client_import_del_conn(struct obd_import *imp, struct obd_uuid *uuid)
137{
138 struct obd_import_conn *imp_conn;
139 struct obd_export *dlmexp;
140 int rc = -ENOENT;
Peng Taod7e09d02013-05-02 16:46:55 +0800141
142 spin_lock(&imp->imp_lock);
143 if (list_empty(&imp->imp_conn_list)) {
144 LASSERT(!imp->imp_connection);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200145 goto out;
Peng Taod7e09d02013-05-02 16:46:55 +0800146 }
147
148 list_for_each_entry(imp_conn, &imp->imp_conn_list, oic_item) {
149 if (!obd_uuid_equals(uuid, &imp_conn->oic_uuid))
150 continue;
151 LASSERT(imp_conn->oic_conn);
152
153 if (imp_conn == imp->imp_conn_current) {
154 LASSERT(imp_conn->oic_conn == imp->imp_connection);
155
156 if (imp->imp_state != LUSTRE_IMP_CLOSED &&
157 imp->imp_state != LUSTRE_IMP_DISCON) {
158 CERROR("can't remove current connection\n");
Julia Lawalld1c0d442014-09-01 22:21:09 +0200159 rc = -EBUSY;
160 goto out;
Peng Taod7e09d02013-05-02 16:46:55 +0800161 }
162
163 ptlrpc_connection_put(imp->imp_connection);
164 imp->imp_connection = NULL;
165
166 dlmexp = class_conn2export(&imp->imp_dlm_handle);
167 if (dlmexp && dlmexp->exp_connection) {
168 LASSERT(dlmexp->exp_connection ==
169 imp_conn->oic_conn);
170 ptlrpc_connection_put(dlmexp->exp_connection);
171 dlmexp->exp_connection = NULL;
172 }
173 }
174
175 list_del(&imp_conn->oic_item);
176 ptlrpc_connection_put(imp_conn->oic_conn);
Julia Lawall352f7892015-05-01 17:51:19 +0200177 kfree(imp_conn);
Peng Taod7e09d02013-05-02 16:46:55 +0800178 CDEBUG(D_HA, "imp %p@%s: remove connection %s\n",
179 imp, imp->imp_obd->obd_name, uuid->uuid);
180 rc = 0;
181 break;
182 }
183out:
184 spin_unlock(&imp->imp_lock);
185 if (rc == -ENOENT)
186 CERROR("connection %s not found\n", uuid->uuid);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800187 return rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800188}
189EXPORT_SYMBOL(client_import_del_conn);
190
191/**
192 * Find conn UUID by peer NID. \a peer is a server NID. This function is used
193 * to find a conn uuid of \a imp which can reach \a peer.
194 */
195int client_import_find_conn(struct obd_import *imp, lnet_nid_t peer,
196 struct obd_uuid *uuid)
197{
198 struct obd_import_conn *conn;
199 int rc = -ENOENT;
Peng Taod7e09d02013-05-02 16:46:55 +0800200
201 spin_lock(&imp->imp_lock);
202 list_for_each_entry(conn, &imp->imp_conn_list, oic_item) {
203 /* Check if conn UUID does have this peer NID. */
204 if (class_check_uuid(&conn->oic_uuid, peer)) {
205 *uuid = conn->oic_uuid;
206 rc = 0;
207 break;
208 }
209 }
210 spin_unlock(&imp->imp_lock);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800211 return rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800212}
213EXPORT_SYMBOL(client_import_find_conn);
214
215void client_destroy_import(struct obd_import *imp)
216{
217 /* Drop security policy instance after all RPCs have finished/aborted
Oleg Drokin6f789a62016-02-24 22:00:29 -0500218 * to let all busy contexts be released.
219 */
Peng Taod7e09d02013-05-02 16:46:55 +0800220 class_import_get(imp);
221 class_destroy_import(imp);
222 sptlrpc_import_sec_put(imp);
223 class_import_put(imp);
224}
225EXPORT_SYMBOL(client_destroy_import);
226
Peng Taod7e09d02013-05-02 16:46:55 +0800227/* Configure an RPC client OBD device.
228 *
229 * lcfg parameters:
230 * 1 - client UUID
231 * 2 - server UUID
232 * 3 - inactive-on-startup
233 */
234int client_obd_setup(struct obd_device *obddev, struct lustre_cfg *lcfg)
235{
236 struct client_obd *cli = &obddev->u.cli;
237 struct obd_import *imp;
238 struct obd_uuid server_uuid;
239 int rq_portal, rp_portal, connect_op;
240 char *name = obddev->obd_type->typ_name;
Oleg Drokin87ba6eb2016-02-24 22:00:04 -0500241 enum ldlm_ns_type ns_type = LDLM_NS_TYPE_UNKNOWN;
Peng Taod7e09d02013-05-02 16:46:55 +0800242 int rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800243
244 /* In a more perfect world, we would hang a ptlrpc_client off of
Oleg Drokin6f789a62016-02-24 22:00:29 -0500245 * obd_type and just use the values from there.
246 */
Mikhail Pershina3310522014-09-08 21:41:27 -0400247 if (!strcmp(name, LUSTRE_OSC_NAME)) {
Peng Taod7e09d02013-05-02 16:46:55 +0800248 rq_portal = OST_REQUEST_PORTAL;
249 rp_portal = OSC_REPLY_PORTAL;
250 connect_op = OST_CONNECT;
251 cli->cl_sp_me = LUSTRE_SP_CLI;
252 cli->cl_sp_to = LUSTRE_SP_OST;
253 ns_type = LDLM_NS_TYPE_OSC;
254 } else if (!strcmp(name, LUSTRE_MDC_NAME) ||
Mikhail Pershina3310522014-09-08 21:41:27 -0400255 !strcmp(name, LUSTRE_LWP_NAME)) {
Peng Taod7e09d02013-05-02 16:46:55 +0800256 rq_portal = MDS_REQUEST_PORTAL;
257 rp_portal = MDC_REPLY_PORTAL;
258 connect_op = MDS_CONNECT;
259 cli->cl_sp_me = LUSTRE_SP_CLI;
260 cli->cl_sp_to = LUSTRE_SP_MDT;
261 ns_type = LDLM_NS_TYPE_MDC;
262 } else if (!strcmp(name, LUSTRE_MGC_NAME)) {
263 rq_portal = MGS_REQUEST_PORTAL;
264 rp_portal = MGC_REPLY_PORTAL;
265 connect_op = MGS_CONNECT;
266 cli->cl_sp_me = LUSTRE_SP_MGC;
267 cli->cl_sp_to = LUSTRE_SP_MGS;
268 cli->cl_flvr_mgc.sf_rpc = SPTLRPC_FLVR_INVALID;
269 ns_type = LDLM_NS_TYPE_MGC;
270 } else {
271 CERROR("unknown client OBD type \"%s\", can't setup\n",
272 name);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800273 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +0800274 }
275
276 if (LUSTRE_CFG_BUFLEN(lcfg, 1) < 1) {
277 CERROR("requires a TARGET UUID\n");
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800278 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +0800279 }
280
281 if (LUSTRE_CFG_BUFLEN(lcfg, 1) > 37) {
282 CERROR("client UUID must be less than 38 characters\n");
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800283 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +0800284 }
285
286 if (LUSTRE_CFG_BUFLEN(lcfg, 2) < 1) {
287 CERROR("setup requires a SERVER UUID\n");
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800288 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +0800289 }
290
291 if (LUSTRE_CFG_BUFLEN(lcfg, 2) > 37) {
292 CERROR("target UUID must be less than 38 characters\n");
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800293 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +0800294 }
295
296 init_rwsem(&cli->cl_sem);
Peng Taod7e09d02013-05-02 16:46:55 +0800297 cli->cl_conn_count = 0;
298 memcpy(server_uuid.uuid, lustre_cfg_buf(lcfg, 2),
299 min_t(unsigned int, LUSTRE_CFG_BUFLEN(lcfg, 2),
300 sizeof(server_uuid)));
301
Hongchao Zhang3147b262016-08-16 16:19:22 -0400302 cli->cl_dirty_pages = 0;
Peng Taod7e09d02013-05-02 16:46:55 +0800303 cli->cl_avail_grant = 0;
Hongchao Zhang3147b262016-08-16 16:19:22 -0400304 /* FIXME: Should limit this for the sum of all cl_dirty_max_pages. */
305 /*
306 * cl_dirty_max_pages may be changed at connect time in
307 * ptlrpc_connect_interpret().
308 */
309 client_adjust_max_dirty(cli);
Peng Taod7e09d02013-05-02 16:46:55 +0800310 INIT_LIST_HEAD(&cli->cl_cache_waiters);
311 INIT_LIST_HEAD(&cli->cl_loi_ready_list);
312 INIT_LIST_HEAD(&cli->cl_loi_hp_ready_list);
313 INIT_LIST_HEAD(&cli->cl_loi_write_list);
314 INIT_LIST_HEAD(&cli->cl_loi_read_list);
John L. Hammond7d53d8f2016-03-30 19:48:36 -0400315 spin_lock_init(&cli->cl_loi_list_lock);
Peng Taod7e09d02013-05-02 16:46:55 +0800316 atomic_set(&cli->cl_pending_w_pages, 0);
317 atomic_set(&cli->cl_pending_r_pages, 0);
318 cli->cl_r_in_flight = 0;
319 cli->cl_w_in_flight = 0;
320
321 spin_lock_init(&cli->cl_read_rpc_hist.oh_lock);
322 spin_lock_init(&cli->cl_write_rpc_hist.oh_lock);
323 spin_lock_init(&cli->cl_read_page_hist.oh_lock);
324 spin_lock_init(&cli->cl_write_page_hist.oh_lock);
325 spin_lock_init(&cli->cl_read_offset_hist.oh_lock);
326 spin_lock_init(&cli->cl_write_offset_hist.oh_lock);
327
328 /* lru for osc. */
329 INIT_LIST_HEAD(&cli->cl_lru_osc);
330 atomic_set(&cli->cl_lru_shrinkers, 0);
Stephen Champion29c877a2016-09-18 16:37:43 -0400331 atomic_long_set(&cli->cl_lru_busy, 0);
332 atomic_long_set(&cli->cl_lru_in_list, 0);
Peng Taod7e09d02013-05-02 16:46:55 +0800333 INIT_LIST_HEAD(&cli->cl_lru_list);
John L. Hammond7d53d8f2016-03-30 19:48:36 -0400334 spin_lock_init(&cli->cl_lru_list_lock);
Stephen Champion29c877a2016-09-18 16:37:43 -0400335 atomic_long_set(&cli->cl_unstable_count, 0);
Peng Taod7e09d02013-05-02 16:46:55 +0800336
337 init_waitqueue_head(&cli->cl_destroy_waitq);
338 atomic_set(&cli->cl_destroy_in_flight, 0);
339 /* Turn on checksumming by default. */
340 cli->cl_checksum = 1;
341 /*
342 * The supported checksum types will be worked out at connect time
343 * Set cl_chksum* to CRC32 for now to avoid returning screwed info
344 * through procfs.
345 */
Nathaniel Clark95c9c002016-06-09 22:35:13 -0400346 cli->cl_cksum_type = OBD_CKSUM_CRC32;
347 cli->cl_supp_cksum_types = OBD_CKSUM_CRC32;
Peng Taod7e09d02013-05-02 16:46:55 +0800348 atomic_set(&cli->cl_resends, OSC_DEFAULT_RESENDS);
349
350 /* This value may be reduced at connect time in
351 * ptlrpc_connect_interpret() . We initialize it to only
352 * 1MB until we know what the performance looks like.
Oleg Drokin6f789a62016-02-24 22:00:29 -0500353 * In the future this should likely be increased. LU-1431
354 */
Peng Taod7e09d02013-05-02 16:46:55 +0800355 cli->cl_max_pages_per_rpc = min_t(int, PTLRPC_MAX_BRW_PAGES,
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300356 LNET_MTU >> PAGE_SHIFT);
Peng Taod7e09d02013-05-02 16:46:55 +0800357
Sebastien Buisson6f6c8e72016-04-28 12:07:35 -0400358 /*
359 * set cl_chunkbits default value to PAGE_CACHE_SHIFT,
360 * it will be updated at OSC connection time.
361 */
362 cli->cl_chunkbits = PAGE_SHIFT;
363
Peng Taod7e09d02013-05-02 16:46:55 +0800364 if (!strcmp(name, LUSTRE_MDC_NAME)) {
Fan Yong1d5d5ec2016-08-16 16:18:48 -0400365 cli->cl_max_rpcs_in_flight = OBD_MAX_RIF_DEFAULT;
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300366 } else if (totalram_pages >> (20 - PAGE_SHIFT) <= 128 /* MB */) {
Peng Taod7e09d02013-05-02 16:46:55 +0800367 cli->cl_max_rpcs_in_flight = 2;
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300368 } else if (totalram_pages >> (20 - PAGE_SHIFT) <= 256 /* MB */) {
Peng Taod7e09d02013-05-02 16:46:55 +0800369 cli->cl_max_rpcs_in_flight = 3;
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300370 } else if (totalram_pages >> (20 - PAGE_SHIFT) <= 512 /* MB */) {
Peng Taod7e09d02013-05-02 16:46:55 +0800371 cli->cl_max_rpcs_in_flight = 4;
372 } else {
Fan Yong1d5d5ec2016-08-16 16:18:48 -0400373 cli->cl_max_rpcs_in_flight = OBD_MAX_RIF_DEFAULT;
Peng Taod7e09d02013-05-02 16:46:55 +0800374 }
375 rc = ldlm_get_ref();
376 if (rc) {
377 CERROR("ldlm_get_ref failed: %d\n", rc);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200378 goto err;
Peng Taod7e09d02013-05-02 16:46:55 +0800379 }
380
381 ptlrpc_init_client(rq_portal, rp_portal, name,
382 &obddev->obd_ldlm_client);
383
384 imp = class_new_import(obddev);
Oleg Drokin44b53f12016-02-16 00:46:47 -0500385 if (!imp) {
Julia Lawalld1c0d442014-09-01 22:21:09 +0200386 rc = -ENOENT;
387 goto err_ldlm;
388 }
Peng Taod7e09d02013-05-02 16:46:55 +0800389 imp->imp_client = &obddev->obd_ldlm_client;
390 imp->imp_connect_op = connect_op;
391 memcpy(cli->cl_target_uuid.uuid, lustre_cfg_buf(lcfg, 1),
392 LUSTRE_CFG_BUFLEN(lcfg, 1));
393 class_import_put(imp);
394
395 rc = client_import_add_conn(imp, &server_uuid, 1);
396 if (rc) {
397 CERROR("can't add initial connection\n");
Julia Lawalld1c0d442014-09-01 22:21:09 +0200398 goto err_import;
Peng Taod7e09d02013-05-02 16:46:55 +0800399 }
400
401 cli->cl_import = imp;
402 /* cli->cl_max_mds_{easize,cookiesize} updated by mdc_init_ea_size() */
403 cli->cl_max_mds_easize = sizeof(struct lov_mds_md_v3);
404 cli->cl_max_mds_cookiesize = sizeof(struct llog_cookie);
405
406 if (LUSTRE_CFG_BUFLEN(lcfg, 3) > 0) {
407 if (!strcmp(lustre_cfg_string(lcfg, 3), "inactive")) {
408 CDEBUG(D_HA, "marking %s %s->%s as inactive\n",
409 name, obddev->obd_name,
410 cli->cl_target_uuid.uuid);
411 spin_lock(&imp->imp_lock);
412 imp->imp_deactive = 1;
413 spin_unlock(&imp->imp_lock);
414 }
415 }
416
417 obddev->obd_namespace = ldlm_namespace_new(obddev, obddev->obd_name,
418 LDLM_NAMESPACE_CLIENT,
419 LDLM_NAMESPACE_GREEDY,
420 ns_type);
Oleg Drokin44b53f12016-02-16 00:46:47 -0500421 if (!obddev->obd_namespace) {
Peng Taod7e09d02013-05-02 16:46:55 +0800422 CERROR("Unable to create client namespace - %s\n",
423 obddev->obd_name);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200424 rc = -ENOMEM;
425 goto err_import;
Peng Taod7e09d02013-05-02 16:46:55 +0800426 }
427
428 cli->cl_qchk_stat = CL_NOT_QUOTACHECKED;
429
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800430 return rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800431
432err_import:
433 class_destroy_import(imp);
434err_ldlm:
435 ldlm_put_ref();
436err:
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800437 return rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800438}
439EXPORT_SYMBOL(client_obd_setup);
440
441int client_obd_cleanup(struct obd_device *obddev)
442{
Peng Taod7e09d02013-05-02 16:46:55 +0800443 ldlm_namespace_free_post(obddev->obd_namespace);
444 obddev->obd_namespace = NULL;
445
Swapnil Pimpaled8555062016-04-27 21:37:14 -0400446 obd_cleanup_client_import(obddev);
Oleg Drokin44b53f12016-02-16 00:46:47 -0500447 LASSERT(!obddev->u.cli.cl_import);
Peng Taod7e09d02013-05-02 16:46:55 +0800448
449 ldlm_put_ref();
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800450 return 0;
Peng Taod7e09d02013-05-02 16:46:55 +0800451}
452EXPORT_SYMBOL(client_obd_cleanup);
453
454/* ->o_connect() method for client side (OSC and MDC and MGC) */
455int client_connect_import(const struct lu_env *env,
456 struct obd_export **exp,
457 struct obd_device *obd, struct obd_uuid *cluuid,
458 struct obd_connect_data *data, void *localdata)
459{
460 struct client_obd *cli = &obd->u.cli;
461 struct obd_import *imp = cli->cl_import;
462 struct obd_connect_data *ocd;
463 struct lustre_handle conn = { 0 };
464 int rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800465
466 *exp = NULL;
467 down_write(&cli->cl_sem);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200468 if (cli->cl_conn_count > 0) {
469 rc = -EALREADY;
470 goto out_sem;
471 }
Peng Taod7e09d02013-05-02 16:46:55 +0800472
473 rc = class_connect(&conn, obd, cluuid);
474 if (rc)
Julia Lawalld1c0d442014-09-01 22:21:09 +0200475 goto out_sem;
Peng Taod7e09d02013-05-02 16:46:55 +0800476
477 cli->cl_conn_count++;
478 *exp = class_conn2export(&conn);
479
480 LASSERT(obd->obd_namespace);
481
482 imp->imp_dlm_handle = conn;
483 rc = ptlrpc_init_import(imp);
484 if (rc != 0)
Julia Lawalld1c0d442014-09-01 22:21:09 +0200485 goto out_ldlm;
Peng Taod7e09d02013-05-02 16:46:55 +0800486
487 ocd = &imp->imp_connect_data;
488 if (data) {
489 *ocd = *data;
490 imp->imp_connect_flags_orig = data->ocd_connect_flags;
491 }
492
493 rc = ptlrpc_connect_import(imp);
494 if (rc != 0) {
Anil Belur05dca372014-06-20 02:01:48 +1000495 LASSERT(imp->imp_state == LUSTRE_IMP_DISCON);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200496 goto out_ldlm;
Peng Taod7e09d02013-05-02 16:46:55 +0800497 }
Oleg Drokin44b53f12016-02-16 00:46:47 -0500498 LASSERT(*exp && (*exp)->exp_connection);
Peng Taod7e09d02013-05-02 16:46:55 +0800499
500 if (data) {
501 LASSERTF((ocd->ocd_connect_flags & data->ocd_connect_flags) ==
Greg Kroah-Hartman55f5a822014-07-12 20:26:07 -0700502 ocd->ocd_connect_flags, "old %#llx, new %#llx\n",
Peng Taod7e09d02013-05-02 16:46:55 +0800503 data->ocd_connect_flags, ocd->ocd_connect_flags);
504 data->ocd_connect_flags = ocd->ocd_connect_flags;
505 }
506
507 ptlrpc_pinger_add_import(imp);
508
Peng Taod7e09d02013-05-02 16:46:55 +0800509 if (rc) {
510out_ldlm:
511 cli->cl_conn_count--;
512 class_disconnect(*exp);
513 *exp = NULL;
514 }
515out_sem:
516 up_write(&cli->cl_sem);
517
518 return rc;
519}
520EXPORT_SYMBOL(client_connect_import);
521
522int client_disconnect_export(struct obd_export *exp)
523{
524 struct obd_device *obd = class_exp2obd(exp);
525 struct client_obd *cli;
526 struct obd_import *imp;
527 int rc = 0, err;
Peng Taod7e09d02013-05-02 16:46:55 +0800528
529 if (!obd) {
Greg Kroah-Hartman55f5a822014-07-12 20:26:07 -0700530 CERROR("invalid export for disconnect: exp %p cookie %#llx\n",
Peng Taod7e09d02013-05-02 16:46:55 +0800531 exp, exp ? exp->exp_handle.h_cookie : -1);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800532 return -EINVAL;
Peng Taod7e09d02013-05-02 16:46:55 +0800533 }
534
535 cli = &obd->u.cli;
536 imp = cli->cl_import;
537
538 down_write(&cli->cl_sem);
Dmitry Eremin6314ccb2016-09-18 16:38:39 -0400539 CDEBUG(D_INFO, "disconnect %s - %zu\n", obd->obd_name,
Peng Taod7e09d02013-05-02 16:46:55 +0800540 cli->cl_conn_count);
541
542 if (!cli->cl_conn_count) {
543 CERROR("disconnecting disconnected device (%s)\n",
544 obd->obd_name);
Julia Lawalld1c0d442014-09-01 22:21:09 +0200545 rc = -EINVAL;
546 goto out_disconnect;
Peng Taod7e09d02013-05-02 16:46:55 +0800547 }
548
549 cli->cl_conn_count--;
Julia Lawalld1c0d442014-09-01 22:21:09 +0200550 if (cli->cl_conn_count) {
551 rc = 0;
552 goto out_disconnect;
553 }
Peng Taod7e09d02013-05-02 16:46:55 +0800554
555 /* Mark import deactivated now, so we don't try to reconnect if any
556 * of the cleanup RPCs fails (e.g. LDLM cancel, etc). We don't
Oleg Drokin6f789a62016-02-24 22:00:29 -0500557 * fully deactivate the import, or that would drop all requests.
558 */
Peng Taod7e09d02013-05-02 16:46:55 +0800559 spin_lock(&imp->imp_lock);
560 imp->imp_deactive = 1;
561 spin_unlock(&imp->imp_lock);
562
563 /* Some non-replayable imports (MDS's OSCs) are pinged, so just
564 * delete it regardless. (It's safe to delete an import that was
Oleg Drokin6f789a62016-02-24 22:00:29 -0500565 * never added.)
566 */
Peng Taod7e09d02013-05-02 16:46:55 +0800567 (void)ptlrpc_pinger_del_import(imp);
568
Oleg Drokin44b53f12016-02-16 00:46:47 -0500569 if (obd->obd_namespace) {
Peng Taod7e09d02013-05-02 16:46:55 +0800570 /* obd_force == local only */
571 ldlm_cli_cancel_unused(obd->obd_namespace, NULL,
572 obd->obd_force ? LCF_LOCAL : 0, NULL);
Andreas Ruprechte7ddc482014-11-23 14:37:49 +0100573 ldlm_namespace_free_prior(obd->obd_namespace, imp,
574 obd->obd_force);
Peng Taod7e09d02013-05-02 16:46:55 +0800575 }
576
577 /* There's no need to hold sem while disconnecting an import,
Oleg Drokin6f789a62016-02-24 22:00:29 -0500578 * and it may actually cause deadlock in GSS.
579 */
Peng Taod7e09d02013-05-02 16:46:55 +0800580 up_write(&cli->cl_sem);
581 rc = ptlrpc_disconnect_import(imp, 0);
582 down_write(&cli->cl_sem);
583
584 ptlrpc_invalidate_import(imp);
585
Peng Taod7e09d02013-05-02 16:46:55 +0800586out_disconnect:
587 /* Use server style - class_disconnect should be always called for
Oleg Drokin6f789a62016-02-24 22:00:29 -0500588 * o_disconnect.
589 */
Peng Taod7e09d02013-05-02 16:46:55 +0800590 err = class_disconnect(exp);
591 if (!rc && err)
592 rc = err;
593
594 up_write(&cli->cl_sem);
595
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800596 return rc;
Peng Taod7e09d02013-05-02 16:46:55 +0800597}
598EXPORT_SYMBOL(client_disconnect_export);
599
Peng Taod7e09d02013-05-02 16:46:55 +0800600/**
601 * Packs current SLV and Limit into \a req.
602 */
603int target_pack_pool_reply(struct ptlrpc_request *req)
604{
605 struct obd_device *obd;
Peng Taod7e09d02013-05-02 16:46:55 +0800606
607 /* Check that we still have all structures alive as this may
Oleg Drokin6f789a62016-02-24 22:00:29 -0500608 * be some late RPC at shutdown time.
609 */
Peng Taod7e09d02013-05-02 16:46:55 +0800610 if (unlikely(!req->rq_export || !req->rq_export->exp_obd ||
611 !exp_connect_lru_resize(req->rq_export))) {
612 lustre_msg_set_slv(req->rq_repmsg, 0);
613 lustre_msg_set_limit(req->rq_repmsg, 0);
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800614 return 0;
Peng Taod7e09d02013-05-02 16:46:55 +0800615 }
616
617 /* OBD is alive here as export is alive, which we checked above. */
618 obd = req->rq_export->exp_obd;
619
620 read_lock(&obd->obd_pool_lock);
621 lustre_msg_set_slv(req->rq_repmsg, obd->obd_pool_slv);
622 lustre_msg_set_limit(req->rq_repmsg, obd->obd_pool_limit);
623 read_unlock(&obd->obd_pool_lock);
624
Greg Kroah-Hartman0a3bdb02013-08-03 10:35:28 +0800625 return 0;
Peng Taod7e09d02013-05-02 16:46:55 +0800626}
627EXPORT_SYMBOL(target_pack_pool_reply);
628
Cihangir Akturk3377bad2015-07-21 10:22:52 +0300629static int
630target_send_reply_msg(struct ptlrpc_request *req, int rc, int fail_id)
Peng Taod7e09d02013-05-02 16:46:55 +0800631{
632 if (OBD_FAIL_CHECK_ORSET(fail_id & ~OBD_FAIL_ONCE, OBD_FAIL_ONCE)) {
633 DEBUG_REQ(D_ERROR, req, "dropping reply");
Julia Lawallfbe7c6c2014-08-26 22:00:33 +0200634 return -ECOMM;
Peng Taod7e09d02013-05-02 16:46:55 +0800635 }
636
637 if (unlikely(rc)) {
638 DEBUG_REQ(D_NET, req, "processing error (%d)", rc);
639 req->rq_status = rc;
Julia Lawallfbe7c6c2014-08-26 22:00:33 +0200640 return ptlrpc_send_error(req, 1);
Peng Taod7e09d02013-05-02 16:46:55 +0800641 }
642
Antonio Murdaca71e8dd92015-06-08 21:48:41 +0200643 DEBUG_REQ(D_NET, req, "sending reply");
Julia Lawallfbe7c6c2014-08-26 22:00:33 +0200644 return ptlrpc_send_reply(req, PTLRPC_REPLY_MAYBE_DIFFICULT);
Peng Taod7e09d02013-05-02 16:46:55 +0800645}
646
647void target_send_reply(struct ptlrpc_request *req, int rc, int fail_id)
648{
649 struct ptlrpc_service_part *svcpt;
650 int netrc;
651 struct ptlrpc_reply_state *rs;
652 struct obd_export *exp;
Peng Taod7e09d02013-05-02 16:46:55 +0800653
Anil Belurb7cfd6d2014-06-20 02:01:47 +1000654 if (req->rq_no_reply)
Peng Taod7e09d02013-05-02 16:46:55 +0800655 return;
Peng Taod7e09d02013-05-02 16:46:55 +0800656
657 svcpt = req->rq_rqbd->rqbd_svcpt;
658 rs = req->rq_reply_state;
Oleg Drokin44b53f12016-02-16 00:46:47 -0500659 if (!rs || !rs->rs_difficult) {
Peng Taod7e09d02013-05-02 16:46:55 +0800660 /* no notifiers */
Anil Belur05dca372014-06-20 02:01:48 +1000661 target_send_reply_msg(req, rc, fail_id);
Peng Taod7e09d02013-05-02 16:46:55 +0800662 return;
663 }
664
665 /* must be an export if locks saved */
Oleg Drokin44b53f12016-02-16 00:46:47 -0500666 LASSERT(req->rq_export);
Peng Taod7e09d02013-05-02 16:46:55 +0800667 /* req/reply consistent */
668 LASSERT(rs->rs_svcpt == svcpt);
669
670 /* "fresh" reply */
Anil Belur05dca372014-06-20 02:01:48 +1000671 LASSERT(!rs->rs_scheduled);
672 LASSERT(!rs->rs_scheduled_ever);
673 LASSERT(!rs->rs_handled);
674 LASSERT(!rs->rs_on_net);
Oleg Drokin44b53f12016-02-16 00:46:47 -0500675 LASSERT(!rs->rs_export);
Anil Belur05dca372014-06-20 02:01:48 +1000676 LASSERT(list_empty(&rs->rs_obd_list));
677 LASSERT(list_empty(&rs->rs_exp_list));
Peng Taod7e09d02013-05-02 16:46:55 +0800678
Anil Belur05dca372014-06-20 02:01:48 +1000679 exp = class_export_get(req->rq_export);
Peng Taod7e09d02013-05-02 16:46:55 +0800680
681 /* disable reply scheduling while I'm setting up */
682 rs->rs_scheduled = 1;
683 rs->rs_on_net = 1;
684 rs->rs_xid = req->rq_xid;
685 rs->rs_transno = req->rq_transno;
686 rs->rs_export = exp;
687 rs->rs_opc = lustre_msg_get_opc(req->rq_reqmsg);
688
689 spin_lock(&exp->exp_uncommitted_replies_lock);
Greg Kroah-Hartmanb0f5aad2014-07-12 20:06:04 -0700690 CDEBUG(D_NET, "rs transno = %llu, last committed = %llu\n",
Peng Taod7e09d02013-05-02 16:46:55 +0800691 rs->rs_transno, exp->exp_last_committed);
692 if (rs->rs_transno > exp->exp_last_committed) {
693 /* not committed already */
694 list_add_tail(&rs->rs_obd_list,
Oleg Drokin24c198e2016-08-21 18:04:35 -0400695 &exp->exp_uncommitted_replies);
Peng Taod7e09d02013-05-02 16:46:55 +0800696 }
697 spin_unlock(&exp->exp_uncommitted_replies_lock);
698
699 spin_lock(&exp->exp_lock);
700 list_add_tail(&rs->rs_exp_list, &exp->exp_outstanding_replies);
701 spin_unlock(&exp->exp_lock);
702
703 netrc = target_send_reply_msg(req, rc, fail_id);
704
705 spin_lock(&svcpt->scp_rep_lock);
706
707 atomic_inc(&svcpt->scp_nreps_difficult);
708
709 if (netrc != 0) {
710 /* error sending: reply is off the net. Also we need +1
711 * reply ref until ptlrpc_handle_rs() is done
712 * with the reply state (if the send was successful, there
713 * would have been +1 ref for the net, which
Oleg Drokin6f789a62016-02-24 22:00:29 -0500714 * reply_out_callback leaves alone)
715 */
Peng Taod7e09d02013-05-02 16:46:55 +0800716 rs->rs_on_net = 0;
717 ptlrpc_rs_addref(rs);
718 }
719
720 spin_lock(&rs->rs_lock);
721 if (rs->rs_transno <= exp->exp_last_committed ||
722 (!rs->rs_on_net && !rs->rs_no_ack) ||
723 list_empty(&rs->rs_exp_list) || /* completed already */
724 list_empty(&rs->rs_obd_list)) {
725 CDEBUG(D_HA, "Schedule reply immediately\n");
726 ptlrpc_dispatch_difficult_reply(rs);
727 } else {
728 list_add(&rs->rs_list, &svcpt->scp_rep_active);
729 rs->rs_scheduled = 0; /* allow notifier to schedule */
730 }
731 spin_unlock(&rs->rs_lock);
732 spin_unlock(&svcpt->scp_rep_lock);
Peng Taod7e09d02013-05-02 16:46:55 +0800733}
734EXPORT_SYMBOL(target_send_reply);
735
Oleg Drokin52ee0d22016-02-24 21:59:54 -0500736enum ldlm_mode lck_compat_array[] = {
Emil Goode805e5172013-07-28 00:38:56 +0200737 [LCK_EX] = LCK_COMPAT_EX,
738 [LCK_PW] = LCK_COMPAT_PW,
739 [LCK_PR] = LCK_COMPAT_PR,
740 [LCK_CW] = LCK_COMPAT_CW,
741 [LCK_CR] = LCK_COMPAT_CR,
742 [LCK_NL] = LCK_COMPAT_NL,
743 [LCK_GROUP] = LCK_COMPAT_GROUP,
744 [LCK_COS] = LCK_COMPAT_COS,
Peng Taod7e09d02013-05-02 16:46:55 +0800745};
746
747/**
748 * Rather arbitrary mapping from LDLM error codes to errno values. This should
749 * not escape to the user level.
750 */
Oleg Drokind1777aa2016-02-24 22:00:02 -0500751int ldlm_error2errno(enum ldlm_error error)
Peng Taod7e09d02013-05-02 16:46:55 +0800752{
753 int result;
754
755 switch (error) {
756 case ELDLM_OK:
Jinshan Xiong06563b52016-03-30 19:48:40 -0400757 case ELDLM_LOCK_MATCHED:
Peng Taod7e09d02013-05-02 16:46:55 +0800758 result = 0;
759 break;
760 case ELDLM_LOCK_CHANGED:
761 result = -ESTALE;
762 break;
763 case ELDLM_LOCK_ABORTED:
764 result = -ENAVAIL;
765 break;
766 case ELDLM_LOCK_REPLACED:
767 result = -ESRCH;
768 break;
769 case ELDLM_NO_LOCK_DATA:
770 result = -ENOENT;
771 break;
772 case ELDLM_NAMESPACE_EXISTS:
773 result = -EEXIST;
774 break;
775 case ELDLM_BAD_NAMESPACE:
776 result = -EBADF;
777 break;
778 default:
779 if (((int)error) < 0) /* cast to signed type */
Oleg Drokind1777aa2016-02-24 22:00:02 -0500780 result = error; /* as enum ldlm_error can be unsigned */
Peng Taod7e09d02013-05-02 16:46:55 +0800781 else {
782 CERROR("Invalid DLM result code: %d\n", error);
783 result = -EPROTO;
784 }
785 }
786 return result;
787}
788EXPORT_SYMBOL(ldlm_error2errno);
789
Peng Taod7e09d02013-05-02 16:46:55 +0800790#if LUSTRE_TRACKS_LOCK_EXP_REFS
791void ldlm_dump_export_locks(struct obd_export *exp)
792{
793 spin_lock(&exp->exp_locks_list_guard);
794 if (!list_empty(&exp->exp_locks_list)) {
795 struct ldlm_lock *lock;
796
Joe Perches2d00bd12014-11-23 11:28:50 -0800797 CERROR("dumping locks for export %p,ignore if the unmount doesn't hang\n",
798 exp);
Peng Taod7e09d02013-05-02 16:46:55 +0800799 list_for_each_entry(lock, &exp->exp_locks_list,
Oleg Drokin24c198e2016-08-21 18:04:35 -0400800 l_exp_refs_link)
Peng Taod7e09d02013-05-02 16:46:55 +0800801 LDLM_ERROR(lock, "lock:");
802 }
803 spin_unlock(&exp->exp_locks_list_guard);
804}
805#endif