1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /******************************************************************************
3*4882a593Smuzhiyun *******************************************************************************
4*4882a593Smuzhiyun **
5*4882a593Smuzhiyun ** Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
6*4882a593Smuzhiyun ** Copyright (C) 2004-2010 Red Hat, Inc. All rights reserved.
7*4882a593Smuzhiyun **
8*4882a593Smuzhiyun **
9*4882a593Smuzhiyun *******************************************************************************
10*4882a593Smuzhiyun ******************************************************************************/
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include "dlm_internal.h"
13*4882a593Smuzhiyun #include "lock.h"
14*4882a593Smuzhiyun #include "user.h"
15*4882a593Smuzhiyun #include "ast.h"
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun static uint64_t dlm_cb_seq;
18*4882a593Smuzhiyun static DEFINE_SPINLOCK(dlm_cb_seq_spin);
19*4882a593Smuzhiyun
dlm_dump_lkb_callbacks(struct dlm_lkb * lkb)20*4882a593Smuzhiyun static void dlm_dump_lkb_callbacks(struct dlm_lkb *lkb)
21*4882a593Smuzhiyun {
22*4882a593Smuzhiyun int i;
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun log_print("last_bast %x %llu flags %x mode %d sb %d %x",
25*4882a593Smuzhiyun lkb->lkb_id,
26*4882a593Smuzhiyun (unsigned long long)lkb->lkb_last_bast.seq,
27*4882a593Smuzhiyun lkb->lkb_last_bast.flags,
28*4882a593Smuzhiyun lkb->lkb_last_bast.mode,
29*4882a593Smuzhiyun lkb->lkb_last_bast.sb_status,
30*4882a593Smuzhiyun lkb->lkb_last_bast.sb_flags);
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun log_print("last_cast %x %llu flags %x mode %d sb %d %x",
33*4882a593Smuzhiyun lkb->lkb_id,
34*4882a593Smuzhiyun (unsigned long long)lkb->lkb_last_cast.seq,
35*4882a593Smuzhiyun lkb->lkb_last_cast.flags,
36*4882a593Smuzhiyun lkb->lkb_last_cast.mode,
37*4882a593Smuzhiyun lkb->lkb_last_cast.sb_status,
38*4882a593Smuzhiyun lkb->lkb_last_cast.sb_flags);
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun for (i = 0; i < DLM_CALLBACKS_SIZE; i++) {
41*4882a593Smuzhiyun log_print("cb %x %llu flags %x mode %d sb %d %x",
42*4882a593Smuzhiyun lkb->lkb_id,
43*4882a593Smuzhiyun (unsigned long long)lkb->lkb_callbacks[i].seq,
44*4882a593Smuzhiyun lkb->lkb_callbacks[i].flags,
45*4882a593Smuzhiyun lkb->lkb_callbacks[i].mode,
46*4882a593Smuzhiyun lkb->lkb_callbacks[i].sb_status,
47*4882a593Smuzhiyun lkb->lkb_callbacks[i].sb_flags);
48*4882a593Smuzhiyun }
49*4882a593Smuzhiyun }
50*4882a593Smuzhiyun
/*
 * Record a new callback in the first lkb_callbacks slot whose seq is zero.
 *
 * @lkb:     lock block that owns the callback array
 * @flags:   DLM_CB_* flags describing the callback
 * @mode:    lock mode carried by the callback
 * @status:  value stored as sb_status
 * @sbflags: value stored as sb_flags (only the low 8 bits are kept)
 * @seq:     sequence number for the entry; a slot with seq == 0 counts as free
 *
 * Returns 0 when the callback was stored or deliberately suppressed as a
 * redundant bast, and -1 when every slot is already in use (the array is
 * logged in that case).
 */
int dlm_add_lkb_callback(struct dlm_lkb *lkb, uint32_t flags, int mode,
			 int status, uint32_t sbflags, uint64_t seq)
{
	struct dlm_ls *ls = lkb->lkb_resource->res_ls;
	struct dlm_callback *slot, *prev;
	int idx;

	/* locate the first free slot */
	for (idx = 0; idx < DLM_CALLBACKS_SIZE; idx++) {
		if (!lkb->lkb_callbacks[idx].seq)
			break;
	}

	if (idx == DLM_CALLBACKS_SIZE) {
		log_error(ls, "no callbacks %x %llu flags %x mode %d sb %d %x",
			  lkb->lkb_id, (unsigned long long)seq,
			  flags, mode, status, sbflags);
		dlm_dump_lkb_callbacks(lkb);
		return -1;
	}

	/*
	 * Suppress some redundant basts here, do more on removal.
	 * Don't even add a bast if the callback just before it
	 * is a bast for the same mode or a more restrictive mode.
	 * (the additional > PR check is needed for PR/CW inversion)
	 */
	if (idx > 0 && (flags & DLM_CB_BAST)) {
		prev = &lkb->lkb_callbacks[idx - 1];

		if ((prev->flags & DLM_CB_BAST) &&
		    (prev->mode == mode ||
		     (prev->mode > mode && prev->mode > DLM_LOCK_PR))) {
			log_debug(ls, "skip %x add bast %llu mode %d "
				  "for bast %llu mode %d",
				  lkb->lkb_id,
				  (unsigned long long)seq,
				  mode,
				  (unsigned long long)prev->seq,
				  prev->mode);
			return 0;
		}
	}

	slot = &lkb->lkb_callbacks[idx];
	slot->seq = seq;
	slot->flags = flags;
	slot->mode = mode;
	slot->sb_status = status;
	slot->sb_flags = (sbflags & 0x000000FF);

	return 0;
}
111*4882a593Smuzhiyun
dlm_rem_lkb_callback(struct dlm_ls * ls,struct dlm_lkb * lkb,struct dlm_callback * cb,int * resid)112*4882a593Smuzhiyun int dlm_rem_lkb_callback(struct dlm_ls *ls, struct dlm_lkb *lkb,
113*4882a593Smuzhiyun struct dlm_callback *cb, int *resid)
114*4882a593Smuzhiyun {
115*4882a593Smuzhiyun int i, rv;
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun *resid = 0;
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun if (!lkb->lkb_callbacks[0].seq) {
120*4882a593Smuzhiyun rv = -ENOENT;
121*4882a593Smuzhiyun goto out;
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun /* oldest undelivered cb is callbacks[0] */
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun memcpy(cb, &lkb->lkb_callbacks[0], sizeof(struct dlm_callback));
127*4882a593Smuzhiyun memset(&lkb->lkb_callbacks[0], 0, sizeof(struct dlm_callback));
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /* shift others down */
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun for (i = 1; i < DLM_CALLBACKS_SIZE; i++) {
132*4882a593Smuzhiyun if (!lkb->lkb_callbacks[i].seq)
133*4882a593Smuzhiyun break;
134*4882a593Smuzhiyun memcpy(&lkb->lkb_callbacks[i-1], &lkb->lkb_callbacks[i],
135*4882a593Smuzhiyun sizeof(struct dlm_callback));
136*4882a593Smuzhiyun memset(&lkb->lkb_callbacks[i], 0, sizeof(struct dlm_callback));
137*4882a593Smuzhiyun (*resid)++;
138*4882a593Smuzhiyun }
139*4882a593Smuzhiyun
140*4882a593Smuzhiyun /* if cb is a bast, it should be skipped if the blocking mode is
141*4882a593Smuzhiyun compatible with the last granted mode */
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun if ((cb->flags & DLM_CB_BAST) && lkb->lkb_last_cast.seq) {
144*4882a593Smuzhiyun if (dlm_modes_compat(cb->mode, lkb->lkb_last_cast.mode)) {
145*4882a593Smuzhiyun cb->flags |= DLM_CB_SKIP;
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun log_debug(ls, "skip %x bast %llu mode %d "
148*4882a593Smuzhiyun "for cast %llu mode %d",
149*4882a593Smuzhiyun lkb->lkb_id,
150*4882a593Smuzhiyun (unsigned long long)cb->seq,
151*4882a593Smuzhiyun cb->mode,
152*4882a593Smuzhiyun (unsigned long long)lkb->lkb_last_cast.seq,
153*4882a593Smuzhiyun lkb->lkb_last_cast.mode);
154*4882a593Smuzhiyun rv = 0;
155*4882a593Smuzhiyun goto out;
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun }
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun if (cb->flags & DLM_CB_CAST) {
160*4882a593Smuzhiyun memcpy(&lkb->lkb_last_cast, cb, sizeof(struct dlm_callback));
161*4882a593Smuzhiyun lkb->lkb_last_cast_time = ktime_get();
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun if (cb->flags & DLM_CB_BAST) {
165*4882a593Smuzhiyun memcpy(&lkb->lkb_last_bast, cb, sizeof(struct dlm_callback));
166*4882a593Smuzhiyun lkb->lkb_last_bast_time = ktime_get();
167*4882a593Smuzhiyun }
168*4882a593Smuzhiyun rv = 0;
169*4882a593Smuzhiyun out:
170*4882a593Smuzhiyun return rv;
171*4882a593Smuzhiyun }
172*4882a593Smuzhiyun
/*
 * Queue a callback for @lkb.
 *
 * A fresh non-zero sequence number is taken from the file-wide counter.
 * Locks flagged DLM_IFL_USER are handed to dlm_user_add_ast().  For all
 * other locks the callback is stored in the lkb; if the lkb had nothing
 * queued before, a reference is taken on it and its work item is either
 * parked on ls_cb_delay (while LSFL_CB_DELAY is set) or queued on the
 * lockspace callback workqueue.
 */
void dlm_add_cb(struct dlm_lkb *lkb, uint32_t flags, int mode, int status,
		uint32_t sbflags)
{
	struct dlm_ls *ls = lkb->lkb_resource->res_ls;
	uint64_t seq, first_seq;
	int err;

	spin_lock(&dlm_cb_seq_spin);
	dlm_cb_seq++;
	if (!dlm_cb_seq)	/* wrapped: seq 0 denotes a free slot */
		dlm_cb_seq++;
	seq = dlm_cb_seq;
	spin_unlock(&dlm_cb_seq_spin);

	if (lkb->lkb_flags & DLM_IFL_USER) {
		dlm_user_add_ast(lkb, flags, mode, status, sbflags, seq);
		return;
	}

	mutex_lock(&lkb->lkb_cb_mutex);

	/* sampled before adding: non-zero means callbacks were already queued */
	first_seq = lkb->lkb_callbacks[0].seq;

	err = dlm_add_lkb_callback(lkb, flags, mode, status, sbflags, seq);

	if (err >= 0 && !first_seq) {
		kref_get(&lkb->lkb_ref);

		mutex_lock(&ls->ls_cb_mutex);
		if (test_bit(LSFL_CB_DELAY, &ls->ls_flags))
			list_add(&lkb->lkb_cb_list, &ls->ls_cb_delay);
		else
			queue_work(ls->ls_callback_wq, &lkb->lkb_cb_work);
		mutex_unlock(&ls->ls_cb_mutex);
	}

	mutex_unlock(&lkb->lkb_cb_mutex);
}
212*4882a593Smuzhiyun
dlm_callback_work(struct work_struct * work)213*4882a593Smuzhiyun void dlm_callback_work(struct work_struct *work)
214*4882a593Smuzhiyun {
215*4882a593Smuzhiyun struct dlm_lkb *lkb = container_of(work, struct dlm_lkb, lkb_cb_work);
216*4882a593Smuzhiyun struct dlm_ls *ls = lkb->lkb_resource->res_ls;
217*4882a593Smuzhiyun void (*castfn) (void *astparam);
218*4882a593Smuzhiyun void (*bastfn) (void *astparam, int mode);
219*4882a593Smuzhiyun struct dlm_callback callbacks[DLM_CALLBACKS_SIZE];
220*4882a593Smuzhiyun int i, rv, resid;
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun memset(&callbacks, 0, sizeof(callbacks));
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun mutex_lock(&lkb->lkb_cb_mutex);
225*4882a593Smuzhiyun if (!lkb->lkb_callbacks[0].seq) {
226*4882a593Smuzhiyun /* no callback work exists, shouldn't happen */
227*4882a593Smuzhiyun log_error(ls, "dlm_callback_work %x no work", lkb->lkb_id);
228*4882a593Smuzhiyun dlm_print_lkb(lkb);
229*4882a593Smuzhiyun dlm_dump_lkb_callbacks(lkb);
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun for (i = 0; i < DLM_CALLBACKS_SIZE; i++) {
233*4882a593Smuzhiyun rv = dlm_rem_lkb_callback(ls, lkb, &callbacks[i], &resid);
234*4882a593Smuzhiyun if (rv < 0)
235*4882a593Smuzhiyun break;
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun
238*4882a593Smuzhiyun if (resid) {
239*4882a593Smuzhiyun /* cbs remain, loop should have removed all, shouldn't happen */
240*4882a593Smuzhiyun log_error(ls, "dlm_callback_work %x resid %d", lkb->lkb_id,
241*4882a593Smuzhiyun resid);
242*4882a593Smuzhiyun dlm_print_lkb(lkb);
243*4882a593Smuzhiyun dlm_dump_lkb_callbacks(lkb);
244*4882a593Smuzhiyun }
245*4882a593Smuzhiyun mutex_unlock(&lkb->lkb_cb_mutex);
246*4882a593Smuzhiyun
247*4882a593Smuzhiyun castfn = lkb->lkb_astfn;
248*4882a593Smuzhiyun bastfn = lkb->lkb_bastfn;
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun for (i = 0; i < DLM_CALLBACKS_SIZE; i++) {
251*4882a593Smuzhiyun if (!callbacks[i].seq)
252*4882a593Smuzhiyun break;
253*4882a593Smuzhiyun if (callbacks[i].flags & DLM_CB_SKIP) {
254*4882a593Smuzhiyun continue;
255*4882a593Smuzhiyun } else if (callbacks[i].flags & DLM_CB_BAST) {
256*4882a593Smuzhiyun bastfn(lkb->lkb_astparam, callbacks[i].mode);
257*4882a593Smuzhiyun } else if (callbacks[i].flags & DLM_CB_CAST) {
258*4882a593Smuzhiyun lkb->lkb_lksb->sb_status = callbacks[i].sb_status;
259*4882a593Smuzhiyun lkb->lkb_lksb->sb_flags = callbacks[i].sb_flags;
260*4882a593Smuzhiyun castfn(lkb->lkb_astparam);
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun }
263*4882a593Smuzhiyun
264*4882a593Smuzhiyun /* undo kref_get from dlm_add_callback, may cause lkb to be freed */
265*4882a593Smuzhiyun dlm_put_lkb(lkb);
266*4882a593Smuzhiyun }
267*4882a593Smuzhiyun
dlm_callback_start(struct dlm_ls * ls)268*4882a593Smuzhiyun int dlm_callback_start(struct dlm_ls *ls)
269*4882a593Smuzhiyun {
270*4882a593Smuzhiyun ls->ls_callback_wq = alloc_workqueue("dlm_callback",
271*4882a593Smuzhiyun WQ_HIGHPRI | WQ_MEM_RECLAIM, 0);
272*4882a593Smuzhiyun if (!ls->ls_callback_wq) {
273*4882a593Smuzhiyun log_print("can't start dlm_callback workqueue");
274*4882a593Smuzhiyun return -ENOMEM;
275*4882a593Smuzhiyun }
276*4882a593Smuzhiyun return 0;
277*4882a593Smuzhiyun }
278*4882a593Smuzhiyun
dlm_callback_stop(struct dlm_ls * ls)279*4882a593Smuzhiyun void dlm_callback_stop(struct dlm_ls *ls)
280*4882a593Smuzhiyun {
281*4882a593Smuzhiyun if (ls->ls_callback_wq)
282*4882a593Smuzhiyun destroy_workqueue(ls->ls_callback_wq);
283*4882a593Smuzhiyun }
284*4882a593Smuzhiyun
dlm_callback_suspend(struct dlm_ls * ls)285*4882a593Smuzhiyun void dlm_callback_suspend(struct dlm_ls *ls)
286*4882a593Smuzhiyun {
287*4882a593Smuzhiyun mutex_lock(&ls->ls_cb_mutex);
288*4882a593Smuzhiyun set_bit(LSFL_CB_DELAY, &ls->ls_flags);
289*4882a593Smuzhiyun mutex_unlock(&ls->ls_cb_mutex);
290*4882a593Smuzhiyun
291*4882a593Smuzhiyun if (ls->ls_callback_wq)
292*4882a593Smuzhiyun flush_workqueue(ls->ls_callback_wq);
293*4882a593Smuzhiyun }
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun #define MAX_CB_QUEUE 25
296*4882a593Smuzhiyun
dlm_callback_resume(struct dlm_ls * ls)297*4882a593Smuzhiyun void dlm_callback_resume(struct dlm_ls *ls)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun struct dlm_lkb *lkb, *safe;
300*4882a593Smuzhiyun int count = 0;
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun clear_bit(LSFL_CB_DELAY, &ls->ls_flags);
303*4882a593Smuzhiyun
304*4882a593Smuzhiyun if (!ls->ls_callback_wq)
305*4882a593Smuzhiyun return;
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun more:
308*4882a593Smuzhiyun mutex_lock(&ls->ls_cb_mutex);
309*4882a593Smuzhiyun list_for_each_entry_safe(lkb, safe, &ls->ls_cb_delay, lkb_cb_list) {
310*4882a593Smuzhiyun list_del_init(&lkb->lkb_cb_list);
311*4882a593Smuzhiyun queue_work(ls->ls_callback_wq, &lkb->lkb_cb_work);
312*4882a593Smuzhiyun count++;
313*4882a593Smuzhiyun if (count == MAX_CB_QUEUE)
314*4882a593Smuzhiyun break;
315*4882a593Smuzhiyun }
316*4882a593Smuzhiyun mutex_unlock(&ls->ls_cb_mutex);
317*4882a593Smuzhiyun
318*4882a593Smuzhiyun if (count)
319*4882a593Smuzhiyun log_rinfo(ls, "dlm_callback_resume %d", count);
320*4882a593Smuzhiyun if (count == MAX_CB_QUEUE) {
321*4882a593Smuzhiyun count = 0;
322*4882a593Smuzhiyun cond_resched();
323*4882a593Smuzhiyun goto more;
324*4882a593Smuzhiyun }
325*4882a593Smuzhiyun }
326*4882a593Smuzhiyun
327