blob: 65008d79c96d2e651091dbd7bcbe47f1e17221ec [file] [log] [blame]
David Teiglande7fd4172006-01-18 09:30:29 +00001/******************************************************************************
2*******************************************************************************
3**
4** Copyright (C) 2005 Red Hat, Inc. All rights reserved.
5**
6** This copyrighted material is made available to anyone wishing to use,
7** modify, copy, or redistribute it subject to the terms and conditions
8** of the GNU General Public License v.2.
9**
10*******************************************************************************
11******************************************************************************/
12
13#include "dlm_internal.h"
14#include "member.h"
15#include "lock.h"
16#include "dir.h"
17#include "config.h"
18#include "requestqueue.h"
19
20struct rq_entry {
21 struct list_head list;
22 int nodeid;
23 char request[1];
24};
25
/*
 * Requests received while the lockspace is in recovery get added to the
 * request queue and processed when recovery is complete.  This happens when
 * the lockspace is suspended on some nodes before it is on others, or the
 * lockspace is enabled on some while still suspended on others.
 */
32
David Teiglandd4400152006-10-31 11:55:56 -060033int dlm_add_requestqueue(struct dlm_ls *ls, int nodeid, struct dlm_header *hd)
David Teiglande7fd4172006-01-18 09:30:29 +000034{
35 struct rq_entry *e;
36 int length = hd->h_length;
David Teiglandd4400152006-10-31 11:55:56 -060037 int rv = 0;
David Teiglande7fd4172006-01-18 09:30:29 +000038
David Teiglande7fd4172006-01-18 09:30:29 +000039 e = kmalloc(sizeof(struct rq_entry) + length, GFP_KERNEL);
40 if (!e) {
41 log_print("dlm_add_requestqueue: out of memory\n");
David Teiglandd4400152006-10-31 11:55:56 -060042 return 0;
David Teiglande7fd4172006-01-18 09:30:29 +000043 }
44
45 e->nodeid = nodeid;
46 memcpy(e->request, hd, length);
47
David Teiglandd4400152006-10-31 11:55:56 -060048 /* We need to check dlm_locking_stopped() after taking the mutex to
49 avoid a race where dlm_recoverd enables locking and runs
50 process_requestqueue between our earlier dlm_locking_stopped check
51 and this addition to the requestqueue. */
52
David Teigland90135922006-01-20 08:47:07 +000053 mutex_lock(&ls->ls_requestqueue_mutex);
David Teiglandd4400152006-10-31 11:55:56 -060054 if (dlm_locking_stopped(ls))
55 list_add_tail(&e->list, &ls->ls_requestqueue);
56 else {
57 log_debug(ls, "dlm_add_requestqueue skip from %d", nodeid);
58 kfree(e);
59 rv = -EAGAIN;
60 }
David Teigland90135922006-01-20 08:47:07 +000061 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglandd4400152006-10-31 11:55:56 -060062 return rv;
David Teiglande7fd4172006-01-18 09:30:29 +000063}
64
65int dlm_process_requestqueue(struct dlm_ls *ls)
66{
67 struct rq_entry *e;
68 struct dlm_header *hd;
69 int error = 0;
70
David Teigland90135922006-01-20 08:47:07 +000071 mutex_lock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +000072
73 for (;;) {
74 if (list_empty(&ls->ls_requestqueue)) {
David Teigland90135922006-01-20 08:47:07 +000075 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +000076 error = 0;
77 break;
78 }
79 e = list_entry(ls->ls_requestqueue.next, struct rq_entry, list);
David Teigland90135922006-01-20 08:47:07 +000080 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +000081
82 hd = (struct dlm_header *) e->request;
David Teigland90135922006-01-20 08:47:07 +000083 error = dlm_receive_message(hd, e->nodeid, 1);
David Teiglande7fd4172006-01-18 09:30:29 +000084
85 if (error == -EINTR) {
86 /* entry is left on requestqueue */
87 log_debug(ls, "process_requestqueue abort eintr");
88 break;
89 }
90
David Teigland90135922006-01-20 08:47:07 +000091 mutex_lock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +000092 list_del(&e->list);
93 kfree(e);
94
95 if (dlm_locking_stopped(ls)) {
96 log_debug(ls, "process_requestqueue abort running");
David Teigland90135922006-01-20 08:47:07 +000097 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +000098 error = -EINTR;
99 break;
100 }
101 schedule();
102 }
103
104 return error;
105}
106
/*
 * After recovery is done, locking is resumed and dlm_recoverd takes all the
 * saved requests and processes them as dlm_recvd would have.  At the same
 * time, dlm_recvd will start receiving new requests from remote nodes.  We
 * want to delay dlm_recvd processing new requests until dlm_recoverd has
 * finished processing the old saved requests.
 */
114
115void dlm_wait_requestqueue(struct dlm_ls *ls)
116{
117 for (;;) {
David Teigland90135922006-01-20 08:47:07 +0000118 mutex_lock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +0000119 if (list_empty(&ls->ls_requestqueue))
120 break;
121 if (dlm_locking_stopped(ls))
122 break;
David Teigland90135922006-01-20 08:47:07 +0000123 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +0000124 schedule();
125 }
David Teigland90135922006-01-20 08:47:07 +0000126 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +0000127}
128
129static int purge_request(struct dlm_ls *ls, struct dlm_message *ms, int nodeid)
130{
131 uint32_t type = ms->m_type;
132
David Teigland2896ee32006-11-27 11:31:22 -0600133 /* the ls is being cleaned up and freed by release_lockspace */
134 if (!ls->ls_count)
135 return 1;
136
David Teiglande7fd4172006-01-18 09:30:29 +0000137 if (dlm_is_removed(ls, nodeid))
138 return 1;
139
140 /* directory operations are always purged because the directory is
141 always rebuilt during recovery and the lookups resent */
142
143 if (type == DLM_MSG_REMOVE ||
144 type == DLM_MSG_LOOKUP ||
145 type == DLM_MSG_LOOKUP_REPLY)
146 return 1;
147
148 if (!dlm_no_directory(ls))
149 return 0;
150
151 /* with no directory, the master is likely to change as a part of
152 recovery; requests to/from the defunct master need to be purged */
153
154 switch (type) {
155 case DLM_MSG_REQUEST:
156 case DLM_MSG_CONVERT:
157 case DLM_MSG_UNLOCK:
158 case DLM_MSG_CANCEL:
159 /* we're no longer the master of this resource, the sender
160 will resend to the new master (see waiter_needs_recovery) */
161
162 if (dlm_hash2nodeid(ls, ms->m_hash) != dlm_our_nodeid())
163 return 1;
164 break;
165
166 case DLM_MSG_REQUEST_REPLY:
167 case DLM_MSG_CONVERT_REPLY:
168 case DLM_MSG_UNLOCK_REPLY:
169 case DLM_MSG_CANCEL_REPLY:
170 case DLM_MSG_GRANT:
171 /* this reply is from the former master of the resource,
172 we'll resend to the new master if needed */
173
174 if (dlm_hash2nodeid(ls, ms->m_hash) != nodeid)
175 return 1;
176 break;
177 }
178
179 return 0;
180}
181
182void dlm_purge_requestqueue(struct dlm_ls *ls)
183{
184 struct dlm_message *ms;
185 struct rq_entry *e, *safe;
186
David Teigland90135922006-01-20 08:47:07 +0000187 mutex_lock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +0000188 list_for_each_entry_safe(e, safe, &ls->ls_requestqueue, list) {
189 ms = (struct dlm_message *) e->request;
190
191 if (purge_request(ls, ms, e->nodeid)) {
192 list_del(&e->list);
193 kfree(e);
194 }
195 }
David Teigland90135922006-01-20 08:47:07 +0000196 mutex_unlock(&ls->ls_requestqueue_mutex);
David Teiglande7fd4172006-01-18 09:30:29 +0000197}
198